{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 66,
   "id": "8db54f91-d2ba-4aa3-84b1-95e8c26cdd51",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[2023/08/30 14:47:19] ppocr DEBUG: Namespace(help='==SUPPRESS==', use_gpu=False, use_xpu=False, use_npu=False, ir_optim=True, use_tensorrt=False, min_subgraph_size=15, precision='fp32', gpu_mem=500, gpu_id=0, image_dir=None, page_num=0, det_algorithm='DB', det_model_dir='/home/lyz/.paddleocr/whl/det/ch/ch_PP-OCRv4_det_infer', det_limit_side_len=960, det_limit_type='max', det_box_type='quad', det_db_thresh=0.3, det_db_box_thresh=0.6, det_db_unclip_ratio=1.5, max_batch_size=10, use_dilation=False, det_db_score_mode='fast', det_east_score_thresh=0.8, det_east_cover_thresh=0.1, det_east_nms_thresh=0.2, det_sast_score_thresh=0.5, det_sast_nms_thresh=0.2, det_pse_thresh=0, det_pse_box_thresh=0.85, det_pse_min_area=16, det_pse_scale=1, scales=[8, 16, 32], alpha=1.0, beta=1.0, fourier_degree=5, rec_algorithm='SVTR_LCNet', rec_model_dir='/home/lyz/.paddleocr/whl/rec/ch/ch_PP-OCRv4_rec_infer', rec_image_inverse=True, rec_image_shape='3, 48, 320', rec_batch_num=6, max_text_length=25, rec_char_dict_path='/home/lyz/.local/lib/python3.9/site-packages/paddleocr/ppocr/utils/ppocr_keys_v1.txt', use_space_char=True, vis_font_path='./doc/fonts/simfang.ttf', drop_score=0.5, e2e_algorithm='PGNet', e2e_model_dir=None, e2e_limit_side_len=768, e2e_limit_type='max', e2e_pgnet_score_thresh=0.5, e2e_char_dict_path='./ppocr/utils/ic15_dict.txt', e2e_pgnet_valid_set='totaltext', e2e_pgnet_mode='fast', use_angle_cls=True, cls_model_dir='/home/lyz/.paddleocr/whl/cls/ch_ppocr_mobile_v2.0_cls_infer', cls_image_shape='3, 48, 192', label_list=['0', '180'], cls_batch_num=6, cls_thresh=0.9, enable_mkldnn=False, cpu_threads=10, use_pdserving=False, warmup=False, sr_model_dir=None, sr_image_shape='3, 32, 128', sr_batch_num=1, draw_img_save_dir='./inference_results', save_crop_res=False, crop_res_save_dir='./output', use_mp=False, total_process_num=1, process_id=0, benchmark=False, save_log_path='./log_output/', show_log=True, use_onnx=False, return_word_box=False, output='./output', 
table_max_len=488, table_algorithm='TableAttn', table_model_dir=None, merge_no_span_structure=True, table_char_dict_path=None, layout_model_dir=None, layout_dict_path=None, layout_score_threshold=0.5, layout_nms_threshold=0.5, kie_algorithm='LayoutXLM', ser_model_dir=None, re_model_dir=None, use_visual_backbone=True, ser_dict_path='../train_data/XFUND/class_list_xfun.txt', ocr_order_method=None, mode='structure', image_orientation=False, layout=True, table=True, ocr=True, recovery=False, use_pdf2docx_api=False, lang='ch', det=True, rec=True, type='ocr', ocr_version='PP-OCRv4', structure_version='PP-StructureV2')\n"
     ]
    }
   ],
   "source": [
    "# Imports for this notebook: standard library first, then third-party packages.\n",
    "import glob\n",
    "from io import StringIO\n",
    "\n",
    "import pandas as pd\n",
    "import requests\n",
    "from paddleocr import PaddleOCR, draw_ocr\n",
    "from pdf2image import convert_from_path\n",
    "\n",
    "# Dataset locations, relative to the notebook's working directory.\n",
    "DATA_ROOT = './标书实体抽取挑战赛公开数据'\n",
    "TEST_LABEL_DIR = './标书实体抽取挑战赛测试集要素名称'\n",
    "\n",
    "# Training split: every entry under train/pdf and train/label, in sorted order.\n",
    "# NOTE(review): presumably sorted so that PDFs and label files pair up by index --\n",
    "# confirm that the file names in both folders actually align.\n",
    "train_pdf = sorted(glob.glob(f'{DATA_ROOT}/train/pdf/*'))\n",
    "train_label = sorted(glob.glob(f'{DATA_ROOT}/train/label/*'))\n",
    "\n",
    "# Test split: the PDFs live under the public data folder, while the files listed\n",
    "# in test_label come from a separate top-level folder.\n",
    "test_pdf = sorted(glob.glob(f'{DATA_ROOT}/test/pdf/*'))\n",
    "test_label = sorted(glob.glob(f'{TEST_LABEL_DIR}/*'))\n",
    "\n",
    "# Shared OCR engine: Chinese models with the text-angle classifier enabled.\n",
    "# Constructing it logs the full PaddleOCR configuration at DEBUG level.\n",
    "ocr = PaddleOCR(use_angle_cls=True, lang=\"ch\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 100,
   "id": "53eac8ae-87c8-4dbf-8810-89338e74eabe",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[2023/08/30 15:46:16] ppocr DEBUG: dt_boxes num : 10, elapse : 0.5190646648406982\n",
      "[2023/08/30 15:46:16] ppocr DEBUG: cls num  : 10, elapse : 0.05770516395568848\n",
      "[2023/08/30 15:46:17] ppocr DEBUG: rec_res num  : 10, elapse : 1.3793835639953613\n",
      "[2023/08/30 15:46:18] ppocr DEBUG: dt_boxes num : 16, elapse : 0.4673466682434082\n",
      "[2023/08/30 15:46:18] ppocr DEBUG: cls num  : 16, elapse : 0.08149027824401855\n",
      "[2023/08/30 15:46:19] ppocr DEBUG: rec_res num  : 16, elapse : 1.5296516418457031\n",
      "[2023/08/30 15:46:20] ppocr DEBUG: dt_boxes num : 36, elapse : 0.49208545684814453\n",
      "[2023/08/30 15:46:20] ppocr DEBUG: cls num  : 36, elapse : 0.18323349952697754\n",
      "[2023/08/30 15:46:24] ppocr DEBUG: rec_res num  : 36, elapse : 3.9673149585723877\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201011166974-信科集团-支出类-物资购销合同-40页扫描件.pdf\n",
      "|    | 要素名称                     | 要素点   |\n",
      "|---:|:-----------------------------|:---------|\n",
      "|  0 | 发票税率                     |          |\n",
      "|  1 | 负责人签名                   |          |\n",
      "|  2 | 合同尾部_受托方_受托方名称值 |          |\n",
      "|  3 | 合同总金额(大写)             |          |\n",
      "|  4 | 支付方式                     |          |\n",
      "|  5 | 支付比例                     |          |\n",
      "|  6 | 合同首部_受托方_受托方名称值 |          |\n",
      "[2023/08/30 15:46:46] ppocr DEBUG: dt_boxes num : 14, elapse : 0.5264196395874023\n",
      "[2023/08/30 15:46:46] ppocr DEBUG: cls num  : 14, elapse : 0.07978129386901855\n",
      "[2023/08/30 15:46:48] ppocr DEBUG: rec_res num  : 14, elapse : 1.7427315711975098\n",
      "[2023/08/30 15:46:48] ppocr DEBUG: dt_boxes num : 31, elapse : 0.49687814712524414\n",
      "[2023/08/30 15:46:48] ppocr DEBUG: cls num  : 31, elapse : 0.16832447052001953\n",
      "[2023/08/30 15:46:54] ppocr DEBUG: rec_res num  : 31, elapse : 6.04237961769104\n",
      "[2023/08/30 15:46:55] ppocr DEBUG: dt_boxes num : 29, elapse : 0.5010638236999512\n",
      "[2023/08/30 15:46:55] ppocr DEBUG: cls num  : 29, elapse : 0.14826130867004395\n",
      "[2023/08/30 15:46:57] ppocr DEBUG: rec_res num  : 29, elapse : 2.2781968116760254\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201110576783-一公院-支出类-设计合同-7页扫描件.pdf\n",
      "|    | 要素名称                         | 要素点   |\n",
      "|---:|:---------------------------------|:---------|\n",
      "|  0 | 合同尾部_卖方信息_名称           |          |\n",
      "|  1 | 小写金额                         |          |\n",
      "|  2 | 支付时间及方式_支付方式_支付条件 |          |\n",
      "|  3 | 合同首部_卖方信息_名称           |          |\n",
      "|  4 | 支付时间及方式_支付方式_支付比例 |          |\n",
      "|  5 | 收款方银行信息_银行账号          |          |\n",
      "|  6 | 合同首部_买方信息_名称           |          |\n",
      "|  7 | 交货_交货地点                    |          |\n",
      "[2023/08/30 15:47:22] ppocr DEBUG: dt_boxes num : 12, elapse : 0.5232574939727783\n",
      "[2023/08/30 15:47:22] ppocr DEBUG: cls num  : 12, elapse : 0.06933975219726562\n",
      "[2023/08/30 15:47:24] ppocr DEBUG: rec_res num  : 12, elapse : 1.611480712890625\n",
      "[2023/08/30 15:47:24] ppocr DEBUG: dt_boxes num : 35, elapse : 0.49165868759155273\n",
      "[2023/08/30 15:47:25] ppocr DEBUG: cls num  : 35, elapse : 0.17900848388671875\n",
      "[2023/08/30 15:47:32] ppocr DEBUG: rec_res num  : 35, elapse : 7.670945644378662\n",
      "[2023/08/30 15:47:33] ppocr DEBUG: dt_boxes num : 22, elapse : 0.4893839359283447\n",
      "[2023/08/30 15:47:33] ppocr DEBUG: cls num  : 22, elapse : 0.11380910873413086\n",
      "[2023/08/30 15:47:36] ppocr DEBUG: rec_res num  : 22, elapse : 3.065817356109619\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201110704238-一公院-支出类-设备 (含船机)购销合同-7页扫描件.pdf\n",
      "|    | 要素名称               | 要素点       |\n",
      "|---:|:-----------------------|:-------------|\n",
      "|  0 | 合同正文_签订日期值    |              |\n",
      "|  1 | 合同正文_合同签订地    |              |\n",
      "|  2 | 合同首部_卖方信息_名称 |              |\n",
      "|  3 | 合同首部_买方信息_名称 |              |\n",
      "|  4 | 型号                   | SIGA-PSIC   |\n",
      "|  5 | 工作电压               | DC18V~DC30V |\n",
      "|  6 | 监视电流               | ≤50μA       |\n",
      "|  7 | 报警电流               | ≤50A        |\n",
      "|  8 | 环境温度               | -20℃～60℃ |\n",
      "|  9 | 环境湿度               | 10%～95%RH |\n",
      "| 10 | 相对湿度               | ≤95%        |\n",
      "| 11 | 保护面积               | ≥20㎡²      |\n",
      "| 12 | 声音报警输出           | 94dBA～98dBA |\n",
      "| 13 | 光报警输出             | 15cd或75cd  |\n",
      "| 14 | 声音报警工作电流       | 40mA        |\n",
      "| 15 | 声音报警工作电压       | 24VDC       |\n",
      "| 16 | 声光报警控制模块       | 具备CPU和智能控制算法和数字通讯技术 |\n",
      "| 17 | 继电器输出             | 1组（双刀双掷） |\n",
      "| 18 | 编码地址               | 占一个编码地址 |\n",
      "[2023/08/30 15:48:13] ppocr DEBUG: dt_boxes num : 25, elapse : 0.5230522155761719\n",
      "[2023/08/30 15:48:13] ppocr DEBUG: cls num  : 25, elapse : 0.12953448295593262\n",
      "[2023/08/30 15:48:16] ppocr DEBUG: rec_res num  : 25, elapse : 2.5115034580230713\n",
      "[2023/08/30 15:48:16] ppocr DEBUG: dt_boxes num : 27, elapse : 0.5010063648223877\n",
      "[2023/08/30 15:48:17] ppocr DEBUG: cls num  : 27, elapse : 0.14365243911743164\n",
      "[2023/08/30 15:48:21] ppocr DEBUG: rec_res num  : 27, elapse : 4.861526966094971\n",
      "[2023/08/30 15:48:22] ppocr DEBUG: dt_boxes num : 43, elapse : 0.4972250461578369\n",
      "[2023/08/30 15:48:22] ppocr DEBUG: cls num  : 43, elapse : 0.22463321685791016\n",
      "[2023/08/30 15:48:26] ppocr DEBUG: rec_res num  : 43, elapse : 3.6099257469177246\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201111215740-民航机场建设集团-支出类-设计合同-8页扫描件.pdf\n",
      "|    | 要素名称                         | 要素点                         |\n",
      "|---:|:---------------------------------|:-------------------------------|\n",
      "|  0 | 合同标的_用途_标的物用途         | 建设工程设计合同               |\n",
      "|  1 | 合同标的额大写                   | 无                             |\n",
      "|  2 | 支付时间及方式_支付方式_支付金额 | $2                            |\n",
      "|  3 | 合同首部_买方信息_名称           | 上海民航新时代机场设计研究院有限公司 |\n",
      "|  4 | 支付时间及方式_支付方式_支付条件 | 无                             |\n",
      "|    | 要素名称                         | 要素点                         |\n",
      "|---:|:---------------------------------|:-------------------------------|\n",
      "|  0 | 合同标的_用途_标的物用途         | 重庆江北国际机场实施仪表着陆ⅡI类运行工程 |\n",
      "|  1 | 合同标的额大写                   | 无                             |\n",
      "|  2 | 支付时间及方式_支付方式_支付金额 | 无                             |\n",
      "|  3 | 合同首部_买方信息_名称           | 无                             |\n",
      "|  4 | 支付时间及方式_支付方式_支付条件 | 无                             |\n",
      "[2023/08/30 15:48:55] ppocr DEBUG: dt_boxes num : 9, elapse : 0.5177116394042969\n",
      "[2023/08/30 15:48:55] ppocr DEBUG: cls num  : 9, elapse : 0.062136173248291016\n",
      "[2023/08/30 15:48:57] ppocr DEBUG: rec_res num  : 9, elapse : 1.5002105236053467\n",
      "[2023/08/30 15:48:57] ppocr DEBUG: dt_boxes num : 41, elapse : 0.45052576065063477\n",
      "[2023/08/30 15:48:57] ppocr DEBUG: cls num  : 41, elapse : 0.21105289459228516\n",
      "[2023/08/30 15:49:05] ppocr DEBUG: rec_res num  : 41, elapse : 7.155740737915039\n",
      "[2023/08/30 15:49:05] ppocr DEBUG: dt_boxes num : 17, elapse : 0.4864499568939209\n",
      "[2023/08/30 15:49:05] ppocr DEBUG: cls num  : 17, elapse : 0.08861756324768066\n",
      "[2023/08/30 15:49:08] ppocr DEBUG: rec_res num  : 17, elapse : 2.6273694038391113\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201210212814-一航局-支出类-专业分包合同-30页扫描件.pdf\n",
      "|    | 要素名称               | 要素点            |\n",
      "|---:|:-----------------------|:-----------------|\n",
      "|  0 | 小写金额               | 无               |\n",
      "|  1 | 合同正文_合同签订地    | 连云港海滨新城金海一期 |\n",
      "|  2 | 合同首部_卖方信息_名称 | 中交一航局二公司 |\n",
      "[2023/08/30 15:49:25] ppocr DEBUG: dt_boxes num : 62, elapse : 0.5467269420623779\n",
      "[2023/08/30 15:49:25] ppocr DEBUG: cls num  : 62, elapse : 0.3280024528503418\n",
      "[2023/08/30 15:49:30] ppocr DEBUG: rec_res num  : 62, elapse : 5.0752177238464355\n",
      "[2023/08/30 15:49:31] ppocr DEBUG: dt_boxes num : 16, elapse : 0.48941636085510254\n",
      "[2023/08/30 15:49:31] ppocr DEBUG: cls num  : 16, elapse : 0.08768725395202637\n",
      "[2023/08/30 15:49:32] ppocr DEBUG: rec_res num  : 16, elapse : 1.659189224243164\n",
      "[2023/08/30 15:49:33] ppocr DEBUG: dt_boxes num : 57, elapse : 0.5056557655334473\n",
      "[2023/08/30 15:49:33] ppocr DEBUG: cls num  : 57, elapse : 0.29448413848876953\n",
      "[2023/08/30 15:49:38] ppocr DEBUG: rec_res num  : 57, elapse : 4.522216558456421\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201210455567-一航局-支出类-设备 (含船机)购销合同-8页扫描件.pdf\n",
      "| 合同名称   | 东营港经济开发区防潮堤 |\n",
      "| 项目名称   | 赁分包合同 |\n",
      "| 工程施工一标 | 无 |\n",
      "| 合同送签单位 | 鲁能项目部 |\n",
      "| 送签日期   | 2012/5/11 |\n",
      "| 主要合同条款 | 分包方：青岛翰德源工程机械和赁行限公司  工期：即自承租方下达开工令之11起至2012年11月30门  分包内容：机械租赁  价款：据实结算 |\n",
      "| 审核部门   | 工程管理部 |\n",
      "| 审核意见   | 偏高 |\n",
      "| 签字     | 刘太洲 |\n",
      "| 日期     | 2012.5.17 |\n",
      "| 落实     | 同意调整后价 |\n",
      "| 其他     | 部分设备台班费和月租费 |\n",
      "| 审核部门   | 企业发展部 |\n",
      "| 审核意见   | 单价均偏高 |\n",
      "| 签字     | 无 |\n",
      "| 日期     | 12.5.17 |\n",
      "| 落实     | 同意调整后租价（合同清单相应更换） |\n",
      "| 审核部门   | 安全监督部 |\n",
      "| 审核意见   | 同意 |\n",
      "| 签字     | 范缺强 |\n",
      "| 日期     | 2012.5.17 |\n",
      "| 落实     | 同意调整后价格 |\n",
      "| 其他     | 装载机、挖掘机、洒水车租赁 |\n",
      "| 审核部门   | 装备部 |\n",
      "| 审核意见   | 装载机、挖掘机洒水车租价偏高 |\n",
      "| 签字     | 无 |\n",
      "| 日期     | 2012.5.17 |\n",
      "| 落实     | 无 |\n",
      "| 审核部门   | 财务部 |\n",
      "| 审核意见   | 无 |\n",
      "| 签字     | 无 |\n",
      "| 日期     | 无 |\n",
      "| 落实     | 无 |\n",
      "| 同意       | 无       |\n",
      "| 12.5.18    | 无       |\n",
      "| 法律事务部 | 无       |\n",
      "| 同意       | 无       |\n",
      "| 所键       | 无       |\n",
      "| 12.5.18    | 无       |\n",
      "| 工管理部长 | 无       |\n",
      "| 同意       | 无       |\n",
      "| 托不久     | 无       |\n",
      "| 20120526   | 无       |\n",
      "| 分管副总   | 无       |\n",
      "| 同意       | 无       |\n",
      "| 2012-5-28  | 无       |\n",
      "| 公司总经理 | 无       |\n",
      "| 2012-6-2  | 无       |\n",
      "| 同意       | 无       |\n",
      "| 车辆类型   | 履带式单斗液压330长臂挖掘机 |\n",
      "| 单价（元） | 1700 |\n",
      "| 数量（台） | 50000 |\n",
      "| 车辆类型   | 履带式单斗液压120挖掘机 |\n",
      "| 单价（元） | 3000 |\n",
      "| 数量（台） | 75000 |\n",
      "| 车辆类型   | 履带式单斗液压230挖掘机 |\n",
      "| 单价（元） | 1000 |\n",
      "| 数量（台） | 30000 |\n",
      "| 车辆类型   | 自卸汽车载重量30T |\n",
      "| 单价（元） | 1500 |\n",
      "| 数量（台） | 36000 |\n",
      "| 车辆类型   | 18T光轮压路机 |\n",
      "| 单价（元） | 1200 |\n",
      "| 数量（台） | 27000 |\n",
      "| 车辆类型   | 东风平头10方洒水车 |\n",
      "| 单价（元） | 900 |\n",
      "| 数量（台） | 25000 |\n",
      "[2023/08/30 15:50:45] ppocr DEBUG: dt_boxes num : 14, elapse : 0.5283045768737793\n",
      "[2023/08/30 15:50:45] ppocr DEBUG: cls num  : 14, elapse : 0.07892060279846191\n",
      "[2023/08/30 15:50:47] ppocr DEBUG: rec_res num  : 14, elapse : 1.8194806575775146\n",
      "[2023/08/30 15:50:47] ppocr DEBUG: dt_boxes num : 35, elapse : 0.49503302574157715\n",
      "[2023/08/30 15:50:48] ppocr DEBUG: cls num  : 35, elapse : 0.17880558967590332\n",
      "[2023/08/30 15:50:55] ppocr DEBUG: rec_res num  : 35, elapse : 7.802832126617432\n",
      "[2023/08/30 15:50:56] ppocr DEBUG: dt_boxes num : 94, elapse : 0.5128910541534424\n",
      "[2023/08/30 15:50:56] ppocr DEBUG: cls num  : 94, elapse : 0.4711289405822754\n",
      "[2023/08/30 15:51:04] ppocr DEBUG: rec_res num  : 94, elapse : 8.031973838806152\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201210917910-一公局-支出类-专业分包合同-15页扫描件.pdf\n",
      "|    | 要素名称               | 要素点   |\n",
      "|---:|:-----------------------|:---------|\n",
      "|  0 | 合同标的额小写         | 2       |\n",
      "|  1 | 合同首部_卖方信息_名称 | 乙方     |\n",
      "|  2 | 合同标的额大写         | 无       |\n",
      "|  3 | 生效_生效时间          | 2012.4.1|\n",
      "|  4 | 率或                    | 间       |\n",
      "|  5 | 计                      | 有       |\n",
      "|  6 | 购                      | 要求     |\n",
      "|  7 | 容量                    |          |\n",
      "|  8 | 挖掘机                  | 1M3     |\n",
      "|  9 |                      | 2       |\n",
      "| 10 |                      | 2       |\n",
      "| 11 |                      | 80%     |\n",
      "| 12 |                      | 1       |\n",
      "| 13 |                      | 2012.4.1|\n",
      "| 14 |                      | 2       |\n",
      "| 15 | 装载机                  | 3M3     |\n",
      "| 16 |                      | 2       |\n",
      "| 17 |                      | 2       |\n",
      "| 18 |                      | 80%     |\n",
      "| 19 |                      | 2012.4.1|\n",
      "| 20 |                      | 3       |\n",
      "| 21 | 起重机                  | 8T      |\n",
      "| 22 |                      | 2       |\n",
      "| 23 |                      | 2       |\n",
      "| 24 |                      | 80%     |\n",
      "| 25 |                      | 2012.4.1|\n",
      "| 26 |                      | 4       |\n",
      "| 27 | 运输车辆                | 12T     |\n",
      "| 28 |                      | 8       |\n",
      "| 29 |                      | 8       |\n",
      "| 30 |                      | 80%     |\n",
      "| 31 |                      | 2012.4.1|\n",
      "| 32 | 合计                    | 15-     |\n",
      "| 33 | 甲方                    |          |\n",
      "| 34 | 乙方                    |          |\n",
      "[2023/08/30 15:52:18] ppocr DEBUG: dt_boxes num : 19, elapse : 0.5273449420928955\n",
      "[2023/08/30 15:52:18] ppocr DEBUG: cls num  : 19, elapse : 0.10464739799499512\n",
      "[2023/08/30 15:52:20] ppocr DEBUG: rec_res num  : 19, elapse : 2.041266918182373\n",
      "[2023/08/30 15:52:21] ppocr DEBUG: dt_boxes num : 34, elapse : 0.4953930377960205\n",
      "[2023/08/30 15:52:21] ppocr DEBUG: cls num  : 34, elapse : 0.1824944019317627\n",
      "[2023/08/30 15:52:28] ppocr DEBUG: rec_res num  : 34, elapse : 7.1062774658203125\n",
      "[2023/08/30 15:52:29] ppocr DEBUG: dt_boxes num : 16, elapse : 0.4953882694244385\n",
      "[2023/08/30 15:52:29] ppocr DEBUG: cls num  : 16, elapse : 0.0865333080291748\n",
      "[2023/08/30 15:52:30] ppocr DEBUG: rec_res num  : 16, elapse : 1.3741753101348877\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201210918007-一公局-支出类-专业分包合同-26页扫描件.pdf\n",
      "|    | 要素名称                     | 要素点   |\n",
      "|---:|:-----------------------------|:---------|\n",
      "|  0 | 合同标的额小写               |          |\n",
      "|  1 | 合同首部_卖方信息_名称       |          |\n",
      "|  2 | 售后服务_质保_质保期起算时间 |          |\n",
      "|  3 | 合同首部_买方信息_名称       |          |\n",
      "|  4 | 大写金额                     |          |\n",
      "[2023/08/30 15:52:49] ppocr DEBUG: dt_boxes num : 66, elapse : 0.5436558723449707\n",
      "[2023/08/30 15:52:49] ppocr DEBUG: cls num  : 66, elapse : 0.33405399322509766\n",
      "[2023/08/30 15:52:56] ppocr DEBUG: rec_res num  : 66, elapse : 7.083620548248291\n",
      "[2023/08/30 15:52:57] ppocr DEBUG: dt_boxes num : 36, elapse : 0.5084640979766846\n",
      "[2023/08/30 15:52:57] ppocr DEBUG: cls num  : 36, elapse : 0.18987703323364258\n",
      "[2023/08/30 15:53:06] ppocr DEBUG: rec_res num  : 36, elapse : 8.570513486862183\n",
      "[2023/08/30 15:53:06] ppocr DEBUG: dt_boxes num : 2, elapse : 0.5002560615539551\n",
      "[2023/08/30 15:53:06] ppocr DEBUG: cls num  : 2, elapse : 0.017423152923583984\n",
      "[2023/08/30 15:53:06] ppocr DEBUG: rec_res num  : 2, elapse : 0.2510182857513428\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201210928685-三公局-支出类-物资购销合同-4页扫描件.pdf\n",
      "|    | 要素名称               | 要素点       |\n",
      "|---:|:-----------------------|:-------------|\n",
      "|  0 | 合同正文_合同签订地    | 铜仁市玉屏县大龙镇 |\n",
      "|  1 | 合同首部_买方信息_名称 | 中交第三公路工程局有限公司铜仁至大龙 |\n",
      "\n",
      "|    | 要素名称               | 要素点   |\n",
      "|---:|:-----------------------|:---------|\n",
      "|  0 | 合同正文_合同签订地    | 无       |\n",
      "|  1 | 合同首部_买方信息_名称 | 无       |\n",
      "\n",
      "|    | 要素名称               | 要素点        |\n",
      "|---:|:-----------------------|:--------------|\n",
      "|  0 | 合同正文_合同签订地    | 贵州省农村信用社联合社 |\n",
      "|  1 | 合同首部_买方信息_名称 | 无                |\n",
      "\n",
      "|    | 要素名称               | 要素点   |\n",
      "|---:|:-----------------------|:---------|\n",
      "|  0 | 合同正文_合同签订地    |          |\n",
      "|  1 | 合同首部_买方信息_名称 |          |\n",
      "[2023/08/30 15:53:49] ppocr DEBUG: dt_boxes num : 6, elapse : 0.5288732051849365\n",
      "[2023/08/30 15:53:49] ppocr DEBUG: cls num  : 6, elapse : 0.03900313377380371\n",
      "[2023/08/30 15:53:51] ppocr DEBUG: rec_res num  : 6, elapse : 1.4244978427886963\n",
      "[2023/08/30 15:53:51] ppocr DEBUG: dt_boxes num : 29, elapse : 0.4981510639190674\n",
      "[2023/08/30 15:53:52] ppocr DEBUG: cls num  : 29, elapse : 0.15446877479553223\n",
      "[2023/08/30 15:53:59] ppocr DEBUG: rec_res num  : 29, elapse : 7.74037504196167\n",
      "[2023/08/30 15:54:00] ppocr DEBUG: dt_boxes num : 37, elapse : 0.49834656715393066\n",
      "[2023/08/30 15:54:00] ppocr DEBUG: cls num  : 37, elapse : 0.18933725357055664\n",
      "[2023/08/30 15:54:05] ppocr DEBUG: rec_res num  : 37, elapse : 4.605646848678589\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201211133943-一航局-支出类-设备 (含船机)购销合同-28页扫描件.pdf\n",
      "|    | 要素名称               | 要素点   |\n",
      "|---:|:-----------------------|:---------|\n",
      "|  0 | 合同标的额大写         |          |\n",
      "|  1 | 开票_发票_发票类型     |          |\n",
      "|  2 | 合同首部_卖方信息_名称 |          |\n",
      "|  3 | 合同标的额小写         |          |\n",
      "|  4 | 合同首部_买方信息_名称 |          |\n",
      "[2023/08/30 15:54:28] ppocr DEBUG: dt_boxes num : 39, elapse : 0.5309183597564697\n",
      "[2023/08/30 15:54:29] ppocr DEBUG: cls num  : 39, elapse : 0.21010875701904297\n",
      "[2023/08/30 15:54:36] ppocr DEBUG: rec_res num  : 39, elapse : 7.895054340362549\n",
      "[2023/08/30 15:54:37] ppocr DEBUG: dt_boxes num : 40, elapse : 0.49418044090270996\n",
      "[2023/08/30 15:54:37] ppocr DEBUG: cls num  : 40, elapse : 0.2026991844177246\n",
      "[2023/08/30 15:54:46] ppocr DEBUG: rec_res num  : 40, elapse : 8.359474420547485\n",
      "[2023/08/30 15:54:46] ppocr DEBUG: dt_boxes num : 1, elapse : 0.4775364398956299\n",
      "[2023/08/30 15:54:46] ppocr DEBUG: cls num  : 1, elapse : 0.011125564575195312\n",
      "[2023/08/30 15:54:46] ppocr DEBUG: rec_res num  : 1, elapse : 0.06939005851745605\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201310177080-一航局-支出类-劳务分包合同-28页扫描件.pdf\n",
      "|    | 要素名称                             | 要素点   |\n",
      "|---:|:-------------------------------------|:---------|\n",
      "|  0 | 合同标的额小写                       |          |\n",
      "|  1 | 大写金额                             |          |\n",
      "|  2 | 支付时间及方式_支付方式_支付时间期限 |          |\n",
      "[2023/08/30 15:54:59] ppocr DEBUG: dt_boxes num : 43, elapse : 0.5402967929840088\n",
      "[2023/08/30 15:54:59] ppocr DEBUG: cls num  : 43, elapse : 0.21978139877319336\n",
      "[2023/08/30 15:55:10] ppocr DEBUG: rec_res num  : 43, elapse : 10.455554246902466\n",
      "[2023/08/30 15:55:10] ppocr DEBUG: dt_boxes num : 52, elapse : 0.4989280700683594\n",
      "[2023/08/30 15:55:10] ppocr DEBUG: cls num  : 52, elapse : 0.26280975341796875\n",
      "[2023/08/30 15:55:23] ppocr DEBUG: rec_res num  : 52, elapse : 12.439791917800903\n",
      "[2023/08/30 15:55:23] ppocr DEBUG: dt_boxes num : 13, elapse : 0.49282169342041016\n",
      "[2023/08/30 15:55:23] ppocr DEBUG: cls num  : 13, elapse : 0.0714714527130127\n",
      "[2023/08/30 15:55:26] ppocr DEBUG: rec_res num  : 13, elapse : 2.993962526321411\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201310562425-中交建筑-支出类-劳务分包合同-13页扫描件.pdf\n",
      "|    | 要素名称                 | 要素点       |\n",
      "|---:|:-------------------------|:-------------|\n",
      "|  0 | 合同标的_用途_标的物用途 | 哈撒尔街大桥预制梁安装工程 |\n",
      "|  1 | 合同首部_卖方信息_名称   | 中交四公局第三工程有限公司内蒙古四子王旗市政工程项目部 |\n",
      "|  2 | 合同首部_买方信息_名称   | 呼和浩特市锯元工程机械设备租赁有限责任公司 |\n",
      "|  3 | 合同标的_用途_标的物用途 | 安装空心板梁混凝土 |\n",
      "|  4 | 合同首部_卖方信息_名称   | 中交四公局第三工程有限公司内蒙古四子王旗市政工程项目经理部 |\n",
      "|  5 | 合同首部_买方信息_名称   | 无           |\n",
      "|  6 | 合同标的_用途_标的物用途 | 无           |\n",
      "|  7 | 合同首部_卖方信息_名称   | 甲方         |\n",
      "|  8 | 合同首部_买方信息_名称   | 乙方         |\n",
      "[2023/08/30 15:56:01] ppocr DEBUG: dt_boxes num : 35, elapse : 0.5330295562744141\n",
      "[2023/08/30 15:56:01] ppocr DEBUG: cls num  : 35, elapse : 0.18424057960510254\n",
      "[2023/08/30 15:56:07] ppocr DEBUG: rec_res num  : 35, elapse : 6.474583625793457\n",
      "[2023/08/30 15:56:08] ppocr DEBUG: dt_boxes num : 32, elapse : 0.4934697151184082\n",
      "[2023/08/30 15:56:08] ppocr DEBUG: cls num  : 32, elapse : 0.1694502830505371\n",
      "[2023/08/30 15:56:15] ppocr DEBUG: rec_res num  : 32, elapse : 7.078346014022827\n",
      "[2023/08/30 15:56:16] ppocr DEBUG: dt_boxes num : 87, elapse : 0.5215015411376953\n",
      "[2023/08/30 15:56:16] ppocr DEBUG: cls num  : 87, elapse : 0.4449913501739502\n",
      "[2023/08/30 15:56:25] ppocr DEBUG: rec_res num  : 87, elapse : 9.146509647369385\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201310863030-民航机场建设集团-支出类-专业分包合同-23页扫描件.pdf\n",
      "|    | 要素名称                                 | 要素点   |\n",
      "|---:|:-----------------------------------------|:---------|\n",
      "|  0 | 合同尾部_卖方信息_签署日期值             |          |\n",
      "|  1 | 售后服务_履约保证金_履约保证金比例       |          |\n",
      "|  2 | 合同标的额小写                           |          |\n",
      "|  3 | 验收_验收标准                            |          |\n",
      "|  4 | 合同正文_合同签订地                      |          |\n",
      "|  5 | 违约责任_卖方责任_产品不符合约定责任条款 |          |\n",
      "|  6 | 生效_生效条件                            |          |\n",
      "[2023/08/30 15:56:56] ppocr DEBUG: dt_boxes num : 9, elapse : 0.5263745784759521\n",
      "[2023/08/30 15:56:56] ppocr DEBUG: cls num  : 9, elapse : 0.05100584030151367\n",
      "[2023/08/30 15:56:57] ppocr DEBUG: rec_res num  : 9, elapse : 1.0694403648376465\n",
      "[2023/08/30 15:56:57] ppocr DEBUG: dt_boxes num : 34, elapse : 0.5023164749145508\n",
      "[2023/08/30 15:56:58] ppocr DEBUG: cls num  : 34, elapse : 0.17807817459106445\n",
      "[2023/08/30 15:57:04] ppocr DEBUG: rec_res num  : 34, elapse : 6.492086887359619\n",
      "[2023/08/30 15:57:05] ppocr DEBUG: dt_boxes num : 49, elapse : 0.5128629207611084\n",
      "[2023/08/30 15:57:05] ppocr DEBUG: cls num  : 49, elapse : 0.25509071350097656\n",
      "[2023/08/30 15:57:10] ppocr DEBUG: rec_res num  : 49, elapse : 4.489801406860352\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201311207591-中资集团-支出类-设计合同-11页扫描件.pdf\n",
      "|    | 要素名称               | 要素点   |\n",
      "|---:|:-----------------------|:---------|\n",
      "|  0 | 合同正文_签订日期值    |          |\n",
      "|  1 | 合同首部_卖方信息_名称 |          |\n",
      "|  2 | 合同首部_买方信息_名称 |          |\n",
      "[2023/08/30 15:57:25] ppocr DEBUG: dt_boxes num : 44, elapse : 0.5420162677764893\n",
      "[2023/08/30 15:57:25] ppocr DEBUG: cls num  : 44, elapse : 0.2263791561126709\n",
      "[2023/08/30 15:57:29] ppocr DEBUG: rec_res num  : 44, elapse : 3.563417673110962\n",
      "[2023/08/30 15:57:30] ppocr DEBUG: dt_boxes num : 37, elapse : 0.49848365783691406\n",
      "[2023/08/30 15:57:30] ppocr DEBUG: cls num  : 37, elapse : 0.1916346549987793\n",
      "[2023/08/30 15:57:35] ppocr DEBUG: rec_res num  : 37, elapse : 4.875521183013916\n",
      "[2023/08/30 15:57:35] ppocr DEBUG: dt_boxes num : 43, elapse : 0.4961073398590088\n",
      "[2023/08/30 15:57:35] ppocr DEBUG: cls num  : 43, elapse : 0.2196793556213379\n",
      "[2023/08/30 15:57:39] ppocr DEBUG: rec_res num  : 43, elapse : 3.351921558380127\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201311302717-民航机场建设集团-支出类-设计合同-8页扫描件.pdf\n",
      "       【表格最终格式】\n",
      "        |    | 要素名称               | 要素点   |\n",
      "|---:|:-----------------------|:---------|\n",
      "|  0 | 合同正文_签订日期值    |          |\n",
      "|  1 | 合同首部_卖方信息_名称 |          |\n",
      "|  2 | 合同首部_买方信息_名称 |          |\n",
      "[2023/08/30 15:58:06] ppocr DEBUG: dt_boxes num : 7, elapse : 0.5321140289306641\n",
      "[2023/08/30 15:58:06] ppocr DEBUG: cls num  : 7, elapse : 0.043755292892456055\n",
      "[2023/08/30 15:58:07] ppocr DEBUG: rec_res num  : 7, elapse : 0.9242677688598633\n",
      "[2023/08/30 15:58:08] ppocr DEBUG: dt_boxes num : 33, elapse : 0.45591282844543457\n",
      "[2023/08/30 15:58:08] ppocr DEBUG: cls num  : 33, elapse : 0.1690654754638672\n",
      "[2023/08/30 15:58:16] ppocr DEBUG: rec_res num  : 33, elapse : 8.454025030136108\n",
      "[2023/08/30 15:58:17] ppocr DEBUG: dt_boxes num : 1, elapse : 0.48603224754333496\n",
      "[2023/08/30 15:58:17] ppocr DEBUG: cls num  : 1, elapse : 0.013744115829467773\n",
      "[2023/08/30 15:58:17] ppocr DEBUG: rec_res num  : 1, elapse : 0.07100248336791992\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201311324586-中交建筑-支出类-劳务分包合同-33页扫描件.pdf\n",
      "|    | 要素名称                   | 要素点   |\n",
      "|---:|:---------------------------|:---------|\n",
      "|  0 | 合同标的_用途_标的物用途   |          |\n",
      "|  1 | 合同首部_卖方信息_名称     |          |\n",
      "|  2 | 违约责任_卖方责任_责任条款 |          |\n",
      "[2023/08/30 15:59:06] ppocr DEBUG: dt_boxes num : 7, elapse : 0.4555695056915283\n",
      "[2023/08/30 15:59:06] ppocr DEBUG: cls num  : 7, elapse : 0.043213844299316406\n",
      "[2023/08/30 15:59:07] ppocr DEBUG: rec_res num  : 7, elapse : 1.0011024475097656\n",
      "[2023/08/30 15:59:08] ppocr DEBUG: dt_boxes num : 74, elapse : 0.4398219585418701\n",
      "[2023/08/30 15:59:09] ppocr DEBUG: cls num  : 74, elapse : 0.3743002414703369\n",
      "[2023/08/30 15:59:15] ppocr DEBUG: rec_res num  : 74, elapse : 6.03829026222229\n",
      "[2023/08/30 15:59:15] ppocr DEBUG: dt_boxes num : 10, elapse : 0.42119741439819336\n",
      "[2023/08/30 15:59:15] ppocr DEBUG: cls num  : 10, elapse : 0.05363035202026367\n",
      "[2023/08/30 15:59:18] ppocr DEBUG: rec_res num  : 10, elapse : 2.339492082595825\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201410581136-三公局-支出类-劳务分包合同-45页扫描件.pdf\n",
      "|    | 要素名称                   | 要素点        |\n",
      "|---:|:---------------------------|:--------------|\n",
      "|  0 | 合同首部_买方信息_联系电话 |                |\n",
      "|  1 | 合同首部_卖方信息_名称     |                |\n",
      "|  2 | 合同首部_卖方信息_联系人   |                |\n",
      "|  3 | 合同首部_买方信息_名称     |                |\n",
      "[2023/08/30 15:59:46] ppocr DEBUG: dt_boxes num : 98, elapse : 0.49825239181518555\n",
      "[2023/08/30 15:59:46] ppocr DEBUG: cls num  : 98, elapse : 0.4916195869445801\n",
      "[2023/08/30 15:59:54] ppocr DEBUG: rec_res num  : 98, elapse : 7.586550712585449\n",
      "[2023/08/30 15:59:54] ppocr DEBUG: dt_boxes num : 14, elapse : 0.43757152557373047\n",
      "[2023/08/30 15:59:54] ppocr DEBUG: cls num  : 14, elapse : 0.0715034008026123\n",
      "[2023/08/30 15:59:56] ppocr DEBUG: rec_res num  : 14, elapse : 1.6377003192901611\n",
      "[2023/08/30 15:59:56] ppocr DEBUG: dt_boxes num : 1, elapse : 0.44554710388183594\n",
      "[2023/08/30 15:59:56] ppocr DEBUG: cls num  : 1, elapse : 0.006587505340576172\n",
      "[2023/08/30 15:59:56] ppocr DEBUG: rec_res num  : 1, elapse : 0.070831298828125\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201410736682-中交房地产-支出类-专业分包合同-65页扫描件.pdf\n",
      "| 页码       | 1/1      |\n",
      "| 合同审批单 | ZS06CK-  |\n",
      "| 承办日期   | 2014-10-16 |\n",
      "| 其他标记   | 无       |\n",
      "| 存档编号   | 2014-0015 |\n",
      "| 合同名称   | 中房·颐园项目一期防水工程施工承包合同 |\n",
      "| 合同主要条款 | 中房（苏州）地产有限公司 |\n",
      "| 乙方       | 河南恒腾防水防腐有限公司 |\n",
      "| 甲方       | 无       |\n",
      "| 协议标的   | 期防水工程施工 |\n",
      "| 其他协议方 | 合同签订之日起直至项目竣工 |\n",
      "| 标的金额   | 7964323.76 |\n",
      "| 履行期限   | 月进度款支付70%，验收合格支付至80%，竣工结算完成支付至95%，质保期满付 |\n",
      "| 付款时间   | 无       |\n",
      "| 备注       | 无       |\n",
      "| 审批意见   | 无       |\n",
      "| 办理状      | 无       |\n",
      "| 办理时间   | 2014-10-16 |\n",
      "| 办理人     | 刘树明    |\n",
      "| 代办人     | 无       |\n",
      "| 办理意见   | 无       |\n",
      "| 步骤       | 无       |\n",
      "| 态         | 无       |\n",
      "| 部门领导   | 同意     |\n",
      "| 股庆奎     | 无       |\n",
      "| 已办       | 无       |\n",
      "| 2         | 无       |\n",
      "| 15:34:03  | 无       |\n",
      "| 15:39:49  | 无       |\n",
      "| 审核日期     | 2014-10-16 |\n",
      "| 审核人       | 孙毅        |\n",
      "| 审核意见     | 同意        |\n",
      "| 审核时间     | 15:44:54   |\n",
      "| 审核日期     | 2014-10-16 |\n",
      "| 审核人       | 于鹏        |\n",
      "| 审核意见     | 拟同意      |\n",
      "| 审核时间     | 18:17:31   |\n",
      "| 审核日期     | 2014-10-20 |\n",
      "| 审核部门     | 合同管理    |\n",
      "| 审核人       | 戴希聪      |\n",
      "| 审核状态     | 已办        |\n",
      "| 审核次数     | 5          |\n",
      "| 审核时间     | 08:29:12   |\n",
      "| 审核日期     | 2014-10-20 |\n",
      "| 审核人       | 黄云斌      |\n",
      "| 审核部门     | 分管领导    |\n",
      "| 审核状态     | 已办        |\n",
      "| 审核意见     | 同意        |\n",
      "| 审核次数     | 6          |\n",
      "| 审核时间     | 08:33:26   |\n",
      "| 审核日期     | 2014-10-20 |\n",
      "| 审核人       | 赵武        |\n",
      "| 审核部门     | 总经理审    |\n",
      "| 审核状态     | 已办        |\n",
      "| 审核意见     | 同意        |\n",
      "| 审核次数     | 批         |\n",
      "| 审核时间     | 13:20:41   |\n",
      "| 审核日期     | 2014-10-20 |\n",
      "| 审核人       | 苏学良      |\n",
      "| 审核部门     | 办公室用    |\n",
      "| 审核状态     | 已办        |\n",
      "| 审核意见     | 已用章      |\n",
      "| 审核时间     | 14:08:00   |\n",
      "| 要素名称     | 无         |\n",
      "| 要素点       | 无         |\n",
      "| 工程地点   | 苏州市吴江区太湖新城高新路2688号（吴江中学东）   |\n",
      "| 建设单位   | 中房（苏州）地产有限公司   |\n",
      "| 施工单位   | 河南恒腾防水防腐有限公司   |\n",
      "| 签订日期   | 二0一四年10月20日   |\n",
      "[2023/08/30 16:01:10] ppocr DEBUG: dt_boxes num : 87, elapse : 0.5453324317932129\n",
      "[2023/08/30 16:01:11] ppocr DEBUG: cls num  : 87, elapse : 0.4489765167236328\n",
      "[2023/08/30 16:01:19] ppocr DEBUG: rec_res num  : 87, elapse : 8.185081958770752\n",
      "[2023/08/30 16:01:19] ppocr DEBUG: dt_boxes num : 30, elapse : 0.49924683570861816\n",
      "[2023/08/30 16:01:20] ppocr DEBUG: cls num  : 30, elapse : 0.157304048538208\n",
      "[2023/08/30 16:01:26] ppocr DEBUG: rec_res num  : 30, elapse : 6.031280040740967\n",
      "[2023/08/30 16:01:26] ppocr DEBUG: dt_boxes num : 33, elapse : 0.49126172065734863\n",
      "[2023/08/30 16:01:26] ppocr DEBUG: cls num  : 33, elapse : 0.1716313362121582\n",
      "[2023/08/30 16:01:29] ppocr DEBUG: rec_res num  : 33, elapse : 3.085801362991333\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201410925185-一公局-支出类-物资购销合同-5页模糊扫描件.pdf\n",
      "|    | 要素名称               | 要素点                   |\n",
      "|---:|:-----------------------|:-----------------------|\n",
      "|  0 | 合同首部_买方信息_地址 | 广西南宁交通1号线土建施工18标项目经理部 |\n",
      "|  1 | 交货_交货地点          | 广西南宁                 |\n",
      "|  2 | 交货_交货方式_风险转移 |                          |\n",
      "|  3 | 合同首部_卖方信息_名称 | 衡水市华北塑胶有限责任公司   |\n",
      "|  4 | 合同首部_买方信息_名称 | 中交隧道工程局南宁轨道     |\n",
      "|  5 | 合同首部_买方信息_地址 | 琅东站                   |\n",
      "|  6 | 交货_交货地点          | 甲方工地指定地点           |\n",
      "|  7 | 交货_交货方式_风险转移 | 乙方承担                 |\n",
      "|  8 | 合同首部_卖方信息_名称 | 天诺                     |\n",
      "|  9 | 合同首部_买方信息_名称 | 天诺                     |\n",
      "| 10 | 合同首部_买方信息_地址 | 无                       |\n",
      "| 11 | 交货_交货地点          | 无                       |\n",
      "| 12 | 交货_交货方式_风险转移 | 无                       |\n",
      "| 13 | 合同首部_卖方信息_名称 | 华万司                   |\n",
      "| 14 | 合同首部_买方信息_名称 | 无                       |\n",
      "[2023/08/30 16:02:03] ppocr DEBUG: dt_boxes num : 30, elapse : 0.5259804725646973\n",
      "[2023/08/30 16:02:03] ppocr DEBUG: cls num  : 30, elapse : 0.15927886962890625\n",
      "[2023/08/30 16:02:08] ppocr DEBUG: rec_res num  : 30, elapse : 4.838242769241333\n",
      "[2023/08/30 16:02:09] ppocr DEBUG: dt_boxes num : 27, elapse : 0.48810791969299316\n",
      "[2023/08/30 16:02:09] ppocr DEBUG: cls num  : 27, elapse : 0.14156413078308105\n",
      "[2023/08/30 16:02:15] ppocr DEBUG: rec_res num  : 27, elapse : 5.934896230697632\n",
      "[2023/08/30 16:02:15] ppocr DEBUG: dt_boxes num : 53, elapse : 0.4991583824157715\n",
      "[2023/08/30 16:02:16] ppocr DEBUG: cls num  : 53, elapse : 0.2720470428466797\n",
      "[2023/08/30 16:02:21] ppocr DEBUG: rec_res num  : 53, elapse : 4.972649574279785\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201410957473-中交疏浚-支出类-专业分包合同-10页扫描件.pdf\n",
      "|    | 要素名称                                 | 要素点       |\n",
      "|---:|:-----------------------------------------|:-------------|\n",
      "|  0 | 合同标的额小写                           |              |\n",
      "|  1 | 验收_验收标准                            |              |\n",
      "|  2 | 合同正文_合同签订地                      |              |\n",
      "|  3 | 收款方银行信息_账户名称                  |              |\n",
      "|  4 | 违约责任_卖方责任_产品不符合约定责任条款 |              |\n",
      "|  5 | 合同首部_卖方信息_名称                   |              |\n",
      "[2023/08/30 16:02:51] ppocr DEBUG: dt_boxes num : 8, elapse : 0.5273046493530273\n",
      "[2023/08/30 16:02:51] ppocr DEBUG: cls num  : 8, elapse : 0.047522544860839844\n",
      "[2023/08/30 16:02:52] ppocr DEBUG: rec_res num  : 8, elapse : 1.0457954406738281\n",
      "[2023/08/30 16:02:52] ppocr DEBUG: dt_boxes num : 20, elapse : 0.48706650733947754\n",
      "[2023/08/30 16:02:52] ppocr DEBUG: cls num  : 20, elapse : 0.1041257381439209\n",
      "[2023/08/30 16:02:56] ppocr DEBUG: rec_res num  : 20, elapse : 3.1577980518341064\n",
      "[2023/08/30 16:02:56] ppocr DEBUG: dt_boxes num : 20, elapse : 0.5038108825683594\n",
      "[2023/08/30 16:02:56] ppocr DEBUG: cls num  : 20, elapse : 0.10841131210327148\n",
      "[2023/08/30 16:03:00] ppocr DEBUG: rec_res num  : 20, elapse : 4.057368755340576\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201411033436-信科集团-支出类-设备 (含船机)购销合同-28页扫描件.pdf\n",
      "|    | 要素名称                   | 要素点   |\n",
      "|---:|:---------------------------|:---------|\n",
      "|  0 | 合同首部_买方信息_地址     |          |\n",
      "|  1 | 合同尾部_买方信息_名称     |          |\n",
      "|  2 | 合同尾部_卖方信息_联系方式 |          |\n",
      "|  3 | 售后服务_质保_质保内容     |          |\n",
      "|  4 | 生效_生效条件              |          |\n",
      "|  5 | 合同尾部_卖方信息_名称     |          |\n",
      "|  6 | 合同正文_签订日期值        |          |\n",
      "|  7 | 收款方银行信息_开户行      |          |\n",
      "[2023/08/30 16:03:29] ppocr DEBUG: dt_boxes num : 4, elapse : 0.5230638980865479\n",
      "[2023/08/30 16:03:29] ppocr DEBUG: cls num  : 4, elapse : 0.0287477970123291\n",
      "[2023/08/30 16:03:30] ppocr DEBUG: rec_res num  : 4, elapse : 1.0129344463348389\n",
      "[2023/08/30 16:03:30] ppocr DEBUG: dt_boxes num : 27, elapse : 0.5067546367645264\n",
      "[2023/08/30 16:03:30] ppocr DEBUG: cls num  : 27, elapse : 0.1440272331237793\n",
      "[2023/08/30 16:03:35] ppocr DEBUG: rec_res num  : 27, elapse : 4.779938697814941\n",
      "[2023/08/30 16:03:36] ppocr DEBUG: dt_boxes num : 51, elapse : 0.4984285831451416\n",
      "[2023/08/30 16:03:36] ppocr DEBUG: cls num  : 51, elapse : 0.2557389736175537\n",
      "[2023/08/30 16:03:40] ppocr DEBUG: rec_res num  : 51, elapse : 3.9146742820739746\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201411131833-一公院-支出类-设备 (含船机)购销合同-10页扫描件.pdf\n",
      "|    | 要素名称                       | 要素点   |\n",
      "|---:|:-------------------------------|:---------|\n",
      "|  0 | 合同尾部_卖方信息_名称         | 商洛市商州区华恒工程设备租赁有限责任公司 |\n",
      "|  1 | 小写金额                       | 187791.81|\n",
      "|  2 | 日期                           | 无       |\n",
      "|  3 | 合同尾部_买方信息_联系方式     | 无       |\n",
      "|  4 | 合同首部_卖方信息_名称         | 西安中交公路岩土工程有限责任公司 |\n",
      "|  5 | 违约责任_买方责任_解除合同     | 无       |\n",
      "|  6 | 收款方银行信息_银行账号        | 无       |\n",
      "|  7 | 合同尾部_买方信息_名称         | 商洛市商州区华恒工程设备租赁有限责任公司 |\n",
      "|  8 | 争议解决方式_管辖法院          | 无       |\n",
      "|  9 | 大写金额                       | 无       |\n",
      "| 10 | 生效_生效时间                  | 无       |\n",
      "| 11 | 开票_买方开票信息_纳税人识别号 | 无       |\n",
      "| 12 | 生效_生效条件                  | 无       |\n",
      "[2023/08/30 16:04:16] ppocr DEBUG: dt_boxes num : 9, elapse : 0.5291523933410645\n",
      "[2023/08/30 16:04:16] ppocr DEBUG: cls num  : 9, elapse : 0.05178642272949219\n",
      "[2023/08/30 16:04:17] ppocr DEBUG: rec_res num  : 9, elapse : 0.9133610725402832\n",
      "[2023/08/30 16:04:18] ppocr DEBUG: dt_boxes num : 53, elapse : 0.5072095394134521\n",
      "[2023/08/30 16:04:18] ppocr DEBUG: cls num  : 53, elapse : 0.27575039863586426\n",
      "[2023/08/30 16:04:23] ppocr DEBUG: rec_res num  : 53, elapse : 4.81021785736084\n",
      "[2023/08/30 16:04:24] ppocr DEBUG: dt_boxes num : 44, elapse : 0.5106608867645264\n",
      "[2023/08/30 16:04:24] ppocr DEBUG: cls num  : 44, elapse : 0.23021221160888672\n",
      "[2023/08/30 16:04:28] ppocr DEBUG: rec_res num  : 44, elapse : 4.3201727867126465\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201411316563-中交建筑-收入类-施工（总）承包-6页扫描件.pdf\n",
      "|    | 要素名称                   | 要素点   |\n",
      "|---:|:---------------------------|:---------|\n",
      "|  0 | 合同标的_用途_标的物用途   |          |\n",
      "|  1 | 合同正文_签订日期值        |          |\n",
      "|  2 | 合同标的额大写             |          |\n",
      "|  3 | 合同标的额小写             |          |\n",
      "|  4 | 合同首部_买方信息_名称     |          |\n",
      "|  5 | 合同正文_合同签订地        |          |\n",
      "|  6 | 生效_生效时间              |          |\n",
      "|  7 | 合同尾部_买方信息_联系方式 |          |\n",
      "|  8 | 合同首部_卖方信息_名称     |          |\n",
      "|  9 | 合同尾部_买方信息_地址     |          |\n",
      "| 10 | 收款方银行信息_银行账号    |          |\n",
      "| 11 | 收款方银行信息_银行账号    |          |\n",
      "| 12 | 生效_生效条件              |          |\n",
      "[2023/08/30 16:05:18] ppocr DEBUG: dt_boxes num : 50, elapse : 0.5376276969909668\n",
      "[2023/08/30 16:05:18] ppocr DEBUG: cls num  : 50, elapse : 0.25304651260375977\n",
      "[2023/08/30 16:05:27] ppocr DEBUG: rec_res num  : 50, elapse : 8.435013771057129\n",
      "[2023/08/30 16:05:27] ppocr DEBUG: dt_boxes num : 40, elapse : 0.4977114200592041\n",
      "[2023/08/30 16:05:27] ppocr DEBUG: cls num  : 40, elapse : 0.20215749740600586\n",
      "[2023/08/30 16:05:36] ppocr DEBUG: rec_res num  : 40, elapse : 8.441447496414185\n",
      "[2023/08/30 16:05:36] ppocr DEBUG: dt_boxes num : 46, elapse : 0.5004799365997314\n",
      "[2023/08/30 16:05:37] ppocr DEBUG: cls num  : 46, elapse : 0.23769569396972656\n",
      "[2023/08/30 16:05:44] ppocr DEBUG: rec_res num  : 46, elapse : 7.5654072761535645\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201411334205-四航局-支出类-劳务分包合同-17页扫描件.pdf\n",
      "|    | 要素名称                         | 要素点             |\n",
      "|---:|:---------------------------------|:-----------------|\n",
      "|  0 | 送达_指定通讯地址                | 无                |\n",
      "|  1 | 合同首部_卖方信息_地址           | 无                |\n",
      "|  2 | 合同标的额小写                   | 无                |\n",
      "|  3 | 日期                             | 2014年3月2日      |\n",
      "|  4 | 送达_买方受送达人信息_联系人     | 无                |\n",
      "|  5 | 合同首部_卖方信息_名称           | 无                |\n",
      "|  6 | 支付时间及方式_支付方式_支付比例 | 无                |\n",
      "|  7 | 生效_生效条件                    | 同等法律效力      |\n",
      "[2023/08/30 16:06:16] ppocr DEBUG: dt_boxes num : 13, elapse : 0.5261790752410889\n",
      "[2023/08/30 16:06:16] ppocr DEBUG: cls num  : 13, elapse : 0.0743246078491211\n",
      "[2023/08/30 16:06:17] ppocr DEBUG: rec_res num  : 13, elapse : 1.157332181930542\n",
      "[2023/08/30 16:06:18] ppocr DEBUG: dt_boxes num : 83, elapse : 0.51458740234375\n",
      "[2023/08/30 16:06:18] ppocr DEBUG: cls num  : 83, elapse : 0.43129777908325195\n",
      "[2023/08/30 16:06:26] ppocr DEBUG: rec_res num  : 83, elapse : 8.008437871932983\n",
      "[2023/08/30 16:06:27] ppocr DEBUG: dt_boxes num : 23, elapse : 0.49256348609924316\n",
      "[2023/08/30 16:06:27] ppocr DEBUG: cls num  : 23, elapse : 0.1223900318145752\n",
      "[2023/08/30 16:06:29] ppocr DEBUG: rec_res num  : 23, elapse : 1.6205251216888428\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201511143732-西筑公司-收入类-劳务分包合同-5页扫描件.pdf\n",
      "|    | 要素名称               | 要素点   |\n",
      "|---:|:-----------------------|:---------|\n",
      "|  0 | 合同正文_签订日期值    |          |\n",
      "|  1 | 生效_生效时间          |          |\n",
      "|  2 | 合同首部_卖方信息_名称 |          |\n",
      "|  3 | 合同首部_买方信息_名称 |          |\n",
      "[2023/08/30 16:06:52] ppocr DEBUG: dt_boxes num : 4, elapse : 0.5141341686248779\n",
      "[2023/08/30 16:06:52] ppocr DEBUG: cls num  : 4, elapse : 0.02787494659423828\n",
      "[2023/08/30 16:06:52] ppocr DEBUG: rec_res num  : 4, elapse : 0.4376857280731201\n",
      "[2023/08/30 16:06:53] ppocr DEBUG: dt_boxes num : 23, elapse : 0.4855818748474121\n",
      "[2023/08/30 16:06:53] ppocr DEBUG: cls num  : 23, elapse : 0.12089014053344727\n",
      "[2023/08/30 16:06:57] ppocr DEBUG: rec_res num  : 23, elapse : 3.944639205932617\n",
      "[2023/08/30 16:06:57] ppocr DEBUG: dt_boxes num : 17, elapse : 0.48569583892822266\n",
      "[2023/08/30 16:06:57] ppocr DEBUG: cls num  : 17, elapse : 0.09240269660949707\n",
      "[2023/08/30 16:06:59] ppocr DEBUG: rec_res num  : 17, elapse : 1.3837933540344238\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201611379239-中国城乡-收入类-其他工程类合同-5页扫描件.pdf\n",
      "        |    | 要素名称                         | 要素点         |\n",
      "|---:|:---------------------------------|:-------------|\n",
      "|  0 | 支付时间及方式_支付方式_支付金额 |              |\n",
      "|  1 | 支付时间及方式_支付方式_支付金额 |              |\n",
      "|  2 | 合同首部_卖方信息_名称           |              |\n",
      "|  3 | 合同首部_买方信息_名称           |              |\n",
      "|  4 | 合同尾部_卖方信息_联系人         |              |\n",
      "|  5 | 违约责任_卖方责任_责任条款       |              |\n",
      "|  6 | 生效_生效条件                    |              |\n",
      "[2023/08/30 16:07:19] ppocr DEBUG: dt_boxes num : 7, elapse : 0.4810788631439209\n",
      "[2023/08/30 16:07:19] ppocr DEBUG: cls num  : 7, elapse : 0.03885364532470703\n",
      "[2023/08/30 16:07:20] ppocr DEBUG: rec_res num  : 7, elapse : 1.0726256370544434\n",
      "[2023/08/30 16:07:20] ppocr DEBUG: dt_boxes num : 6, elapse : 0.4365963935852051\n",
      "[2023/08/30 16:07:20] ppocr DEBUG: cls num  : 6, elapse : 0.03170156478881836\n",
      "[2023/08/30 16:07:21] ppocr DEBUG: rec_res num  : 6, elapse : 1.1278295516967773\n",
      "[2023/08/30 16:07:22] ppocr DEBUG: dt_boxes num : 6, elapse : 0.483165979385376\n",
      "[2023/08/30 16:07:22] ppocr DEBUG: cls num  : 6, elapse : 0.04150676727294922\n",
      "[2023/08/30 16:07:24] ppocr DEBUG: rec_res num  : 6, elapse : 2.0789475440979004\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201710190380-一航局-收入类-设计施工总承包合同-85页扫描件.pdf\n",
      "【输出信息】\n",
      "|    | 要素名称               | 要素点   |\n",
      "|---:|:-----------------------|:---------|\n",
      "|  0 | 合同首部_卖方信息_名称 |          |\n",
      "|  1 | 合同首部_买方信息_名称 |          |\n",
      "[2023/08/30 16:07:34] ppocr DEBUG: dt_boxes num : 9, elapse : 0.531012773513794\n",
      "[2023/08/30 16:07:34] ppocr DEBUG: cls num  : 9, elapse : 0.0529634952545166\n",
      "[2023/08/30 16:07:36] ppocr DEBUG: rec_res num  : 9, elapse : 1.3107244968414307\n",
      "[2023/08/30 16:07:36] ppocr DEBUG: dt_boxes num : 26, elapse : 0.48418521881103516\n",
      "[2023/08/30 16:07:36] ppocr DEBUG: cls num  : 26, elapse : 0.13499164581298828\n",
      "[2023/08/30 16:07:41] ppocr DEBUG: rec_res num  : 26, elapse : 4.612363338470459\n",
      "[2023/08/30 16:07:42] ppocr DEBUG: dt_boxes num : 28, elapse : 0.48612189292907715\n",
      "[2023/08/30 16:07:42] ppocr DEBUG: cls num  : 28, elapse : 0.14315009117126465\n",
      "[2023/08/30 16:07:45] ppocr DEBUG: rec_res num  : 28, elapse : 3.0611658096313477\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201710984626-中交建筑-收入类-内部任务书-4页扫描件.pdf\n",
      "|    | 要素名称                 | 要素点       |\n",
      "|---:|:-------------------------|:-------------|\n",
      "|  0 | 合同尾部_卖方信息_名称   |                  |\n",
      "|  1 | 合同尾部_卖方信息_地址   |                  |\n",
      "|  2 | 合同标的额小写           |                  |\n",
      "|  3 | 合同正文_合同签订地      |                  |\n",
      "|  4 | 合同首部_卖方信息_名称   |                  |\n",
      "|  5 | 合同标的_用途_标的物用途 |                  |\n",
      "|  6 | 合同尾部_买方信息_名称   |                  |\n",
      "|  7 | 合同标的额大写           |                  |\n",
      "|  8 | 生效_生效条件            |                  |\n",
      "[2023/08/30 16:08:57] ppocr DEBUG: dt_boxes num : 28, elapse : 0.49907636642456055\n",
      "[2023/08/30 16:08:57] ppocr DEBUG: cls num  : 28, elapse : 0.14592480659484863\n",
      "[2023/08/30 16:09:01] ppocr DEBUG: rec_res num  : 28, elapse : 3.38533616065979\n",
      "[2023/08/30 16:09:01] ppocr DEBUG: dt_boxes num : 33, elapse : 0.4514734745025635\n",
      "[2023/08/30 16:09:01] ppocr DEBUG: cls num  : 33, elapse : 0.16539716720581055\n",
      "[2023/08/30 16:09:09] ppocr DEBUG: rec_res num  : 33, elapse : 7.398618698120117\n",
      "[2023/08/30 16:09:10] ppocr DEBUG: dt_boxes num : 37, elapse : 0.49551963806152344\n",
      "[2023/08/30 16:09:10] ppocr DEBUG: cls num  : 37, elapse : 0.19422364234924316\n",
      "[2023/08/30 16:09:15] ppocr DEBUG: rec_res num  : 37, elapse : 4.808817148208618\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201711260968-四航局-收入类-设计施工采购总承包合同-150页扫描件.pdf\n",
      "|    | 要素名称                 | 要素点   |\n",
      "|---:|:-------------------------|:---------|\n",
      "|  0 | 合同标的_用途_标的物用途 | 深圳机场三跑道扩建工程场地陆域形成及软基处理工程 |\n",
      "|  1 | 合同标的额大写           | 无       |\n",
      "|  2 | 日期                     | 2017年三月   |\n",
      "|  3 | 合同标的额小写           | 无       |\n",
      "|  4 | 合同首部_买方信息_名称   | 深圳市土地投资开发中心   |\n",
      "[2023/08/30 16:09:45] ppocr DEBUG: dt_boxes num : 13, elapse : 0.5240025520324707\n",
      "[2023/08/30 16:09:45] ppocr DEBUG: cls num  : 13, elapse : 0.07386040687561035\n",
      "[2023/08/30 16:09:46] ppocr DEBUG: rec_res num  : 13, elapse : 1.6263036727905273\n",
      "[2023/08/30 16:09:47] ppocr DEBUG: dt_boxes num : 26, elapse : 0.45124173164367676\n",
      "[2023/08/30 16:09:47] ppocr DEBUG: cls num  : 26, elapse : 0.13123130798339844\n",
      "[2023/08/30 16:09:53] ppocr DEBUG: rec_res num  : 26, elapse : 6.200353384017944\n",
      "[2023/08/30 16:09:54] ppocr DEBUG: dt_boxes num : 19, elapse : 0.4937312602996826\n",
      "[2023/08/30 16:09:54] ppocr DEBUG: cls num  : 19, elapse : 0.10223269462585449\n",
      "[2023/08/30 16:09:55] ppocr DEBUG: rec_res num  : 19, elapse : 1.350376844406128\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201711459614-中交疏浚-收入类-设计施工总承包合同-31页扫描件.pdf\n",
      "【输出结果】\n",
      "|    | 要素名称                 | 要素点   |\n",
      "|---:|:-------------------------|:---------|\n",
      "|  0 | 合同标的_用途_标的物用途 |          |\n",
      "|  1 | 合同正文_签订日期值      |          |\n",
      "|  2 | 合同正文_合同签订地      |          |\n",
      "|  3 | 日期                     |          |\n",
      "|  4 | 合同首部_卖方信息_名称   |          |\n",
      "|  5 | 合同首部_买方信息_名称   |          |\n",
      "[2023/08/30 16:10:09] ppocr DEBUG: dt_boxes num : 28, elapse : 0.5767755508422852\n",
      "[2023/08/30 16:10:09] ppocr DEBUG: cls num  : 28, elapse : 0.1499333381652832\n",
      "[2023/08/30 16:10:13] ppocr DEBUG: rec_res num  : 28, elapse : 3.950010061264038\n",
      "[2023/08/30 16:10:14] ppocr DEBUG: dt_boxes num : 30, elapse : 0.5232760906219482\n",
      "[2023/08/30 16:10:14] ppocr DEBUG: cls num  : 30, elapse : 0.1566755771636963\n",
      "[2023/08/30 16:10:18] ppocr DEBUG: rec_res num  : 30, elapse : 4.0709569454193115\n",
      "[2023/08/30 16:10:19] ppocr DEBUG: dt_boxes num : 30, elapse : 0.5233287811279297\n",
      "[2023/08/30 16:10:19] ppocr DEBUG: cls num  : 30, elapse : 0.1552436351776123\n",
      "[2023/08/30 16:10:23] ppocr DEBUG: rec_res num  : 30, elapse : 4.29282283782959\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201810171842-中交路建-收入类-赔偿、补偿类合同-4页扫描件.pdf\n",
      "|    | 要素名称                         | 要素点   |\n",
      "|---:|:---------------------------------|:---------|\n",
      "|  0 | 数量_合同原件数量                |    4份      |\n",
      "|  1 | 支付时间及方式_支付方式_支付金额 |   一次性付争议地款贰万贰仟元整     |\n",
      "|  2 | 小写金额                         |   22000元     |\n",
      "|    | 要素名称                         | 要素点   |\n",
      "|---:|:---------------------------------|:---------|\n",
      "|  0 | 数量_合同原件数量                |   4份    |\n",
      "|  1 | 支付时间及方式_支付方式_支付金额 |  一次性付争议地款柒仟元整（7000元）  |\n",
      "|  2 | 小写金额                         |   7000元   |\n",
      "|    | 要素名称                         | 要素点   |\n",
      "|---:|:---------------------------------|:---------|\n",
      "|  0 | 数量_合同原件数量                |          |\n",
      "|  1 | 支付时间及方式_支付方式_支付金额 |          |\n",
      "|  2 | 小写金额                         |          |\n",
      "[2023/08/30 16:10:51] ppocr DEBUG: dt_boxes num : 59, elapse : 0.4953176975250244\n",
      "[2023/08/30 16:10:51] ppocr DEBUG: cls num  : 59, elapse : 0.2873966693878174\n",
      "[2023/08/30 16:10:56] ppocr DEBUG: rec_res num  : 59, elapse : 4.718190908432007\n",
      "[2023/08/30 16:10:57] ppocr DEBUG: dt_boxes num : 38, elapse : 0.4487130641937256\n",
      "[2023/08/30 16:10:57] ppocr DEBUG: cls num  : 38, elapse : 0.19416356086730957\n",
      "[2023/08/30 16:10:59] ppocr DEBUG: rec_res num  : 38, elapse : 2.6094324588775635\n",
      "[2023/08/30 16:11:00] ppocr DEBUG: dt_boxes num : 115, elapse : 0.5270006656646729\n",
      "[2023/08/30 16:11:01] ppocr DEBUG: cls num  : 115, elapse : 0.567681074142456\n",
      "[2023/08/30 16:11:10] ppocr DEBUG: rec_res num  : 115, elapse : 9.089906930923462\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201810217655-一航局-收入类-专业分包合同-68页扫描件.pdf\n",
      "【待填充表格】\n",
      "|    | 要素名称            | 要素点   |\n",
      "|---:|:--------------------|:---------|\n",
      "|  0 | 合同正文_签订日期值 |          |\n",
      "[2023/08/30 16:11:29] ppocr DEBUG: dt_boxes num : 5, elapse : 0.5178673267364502\n",
      "[2023/08/30 16:11:29] ppocr DEBUG: cls num  : 5, elapse : 0.031466007232666016\n",
      "[2023/08/30 16:11:30] ppocr DEBUG: rec_res num  : 5, elapse : 0.9830682277679443\n",
      "[2023/08/30 16:11:31] ppocr DEBUG: dt_boxes num : 69, elapse : 0.49852800369262695\n",
      "[2023/08/30 16:11:31] ppocr DEBUG: cls num  : 69, elapse : 0.3572242259979248\n",
      "[2023/08/30 16:11:37] ppocr DEBUG: rec_res num  : 69, elapse : 6.120898008346558\n",
      "[2023/08/30 16:11:38] ppocr DEBUG: dt_boxes num : 10, elapse : 0.48001670837402344\n",
      "[2023/08/30 16:11:38] ppocr DEBUG: cls num  : 10, elapse : 0.056572914123535156\n",
      "[2023/08/30 16:11:39] ppocr DEBUG: rec_res num  : 10, elapse : 0.9972615242004395\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT201811444794-四航局-收入类-采购施工总承包-6页扫描件.pdf\n",
      "|    | 要素名称               | 要素点              |\n",
      "|---:|:-----------------------|:------------------|\n",
      "|  0 | 合同首部_卖方信息_名称 | 中交第四航局工程局有限公司 |\n",
      "|  1 | 合同首部_买方信息_名称 | 中马公共工程公司     |\n",
      "|  2 | 合同首部_卖方信息_名称 | 小松PC350-8          |\n",
      "|  3 | 合同首部_买方信息_名称 | 徐工ZL50GN          |\n",
      "[2023/08/30 16:11:59] ppocr DEBUG: dt_boxes num : 8, elapse : 0.5178639888763428\n",
      "[2023/08/30 16:11:59] ppocr DEBUG: cls num  : 8, elapse : 0.04571223258972168\n",
      "[2023/08/30 16:12:00] ppocr DEBUG: rec_res num  : 8, elapse : 1.3253793716430664\n",
      "[2023/08/30 16:12:01] ppocr DEBUG: dt_boxes num : 13, elapse : 0.44820094108581543\n",
      "[2023/08/30 16:12:01] ppocr DEBUG: cls num  : 13, elapse : 0.06503462791442871\n",
      "[2023/08/30 16:12:03] ppocr DEBUG: rec_res num  : 13, elapse : 2.093883752822876\n",
      "[2023/08/30 16:12:03] ppocr DEBUG: dt_boxes num : 22, elapse : 0.48333001136779785\n",
      "[2023/08/30 16:12:03] ppocr DEBUG: cls num  : 22, elapse : 0.11460232734680176\n",
      "[2023/08/30 16:12:06] ppocr DEBUG: rec_res num  : 22, elapse : 2.9645586013793945\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT202010023734-二公院-收入类-设计施工总承包合同-36页扫描件.pdf\n",
      "|    | 要素名称                           | 要素点   |\n",
      "|---:|:-----------------------------------|:---------|\n",
      "|  0 | 合同尾部_卖方信息_名称             |          |\n",
      "|  1 | 合同标的额小写                     |          |\n",
      "|  2 | 违约责任_买方责任_逾期付款责任条款 |          |\n",
      "|  3 | 违约责任_买方责任_逾期付款责任条款 |          |\n",
      "|  4 | 不可抗力_不可抗力范围              |          |\n",
      "|  5 | 合同首部_卖方信息_名称             |          |\n",
      "[2023/08/30 16:12:23] ppocr DEBUG: dt_boxes num : 24, elapse : 0.5256226062774658\n",
      "[2023/08/30 16:12:23] ppocr DEBUG: cls num  : 24, elapse : 0.12494134902954102\n",
      "[2023/08/30 16:12:29] ppocr DEBUG: rec_res num  : 24, elapse : 5.550778388977051\n",
      "[2023/08/30 16:12:29] ppocr DEBUG: dt_boxes num : 20, elapse : 0.4945857524871826\n",
      "[2023/08/30 16:12:29] ppocr DEBUG: cls num  : 20, elapse : 0.10773110389709473\n",
      "[2023/08/30 16:12:33] ppocr DEBUG: rec_res num  : 20, elapse : 4.0661540031433105\n",
      "[2023/08/30 16:12:34] ppocr DEBUG: dt_boxes num : 42, elapse : 0.49214601516723633\n",
      "[2023/08/30 16:12:34] ppocr DEBUG: cls num  : 42, elapse : 0.2190718650817871\n",
      "[2023/08/30 16:12:38] ppocr DEBUG: rec_res num  : 42, elapse : 4.300669193267822\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT202110330559-三航局-收入类-赔偿、补偿类合同-3页扫描件.pdf\n",
      "|    | 要素名称                | 要素点                       |\n",
      "|---:|:------------------------|:-----------------------------|\n",
      "|  0 | 合同尾部_卖方信息_名称  |                             |\n",
      "|  1 | 合同尾部_买方信息_地址  |                             |\n",
      "|  2 | 收款方银行信息_银行账号 |                             |\n",
      "|  3 | 合同尾部_买方信息_名称  |                             |\n",
      "|  4 | 收款方银行信息_开户行   |                             |\n",
      "|  5 | 争议解决方式_管辖法院   |                             |\n",
      "|  6 | 生效_生效时间           |                             |\n",
      "|  7 | 生效_生效条件           |                             |\n",
      "[2023/08/30 16:13:06] ppocr DEBUG: dt_boxes num : 13, elapse : 0.5216987133026123\n",
      "[2023/08/30 16:13:06] ppocr DEBUG: cls num  : 13, elapse : 0.0726318359375\n",
      "[2023/08/30 16:13:07] ppocr DEBUG: rec_res num  : 13, elapse : 1.489478349685669\n",
      "[2023/08/30 16:13:08] ppocr DEBUG: dt_boxes num : 49, elapse : 0.4922451972961426\n",
      "[2023/08/30 16:13:08] ppocr DEBUG: cls num  : 49, elapse : 0.2566795349121094\n",
      "[2023/08/30 16:13:16] ppocr DEBUG: rec_res num  : 49, elapse : 7.299708127975464\n",
      "[2023/08/30 16:13:16] ppocr DEBUG: dt_boxes num : 83, elapse : 0.5039060115814209\n",
      "[2023/08/30 16:13:17] ppocr DEBUG: cls num  : 83, elapse : 0.4210062026977539\n",
      "[2023/08/30 16:13:23] ppocr DEBUG: rec_res num  : 83, elapse : 5.954737901687622\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT202110629429-四航局-收入类-赔偿、补偿类合同-3页扫描件.pdf\n",
      "|    | 要素名称               | 要素点   |\n",
      "|---:|:-----------------------|:---------|\n",
      "|  0 | 合同尾部_卖方信息_名称 |          |\n",
      "|  1 | 开票_发票_类型         |          |\n",
      "|  2 | 合同标的额小写         |          |\n",
      "|  3 | 合同尾部_买方信息_名称 |          |\n",
      "|  4 | 合同标的额大写         |          |\n",
      "|  5 | 合同首部_买方信息_名称 |          |\n",
      "|  6 | 生效_生效条件          |          |\n",
      "[2023/08/30 16:14:01] ppocr DEBUG: dt_boxes num : 13, elapse : 0.5183656215667725\n",
      "[2023/08/30 16:14:01] ppocr DEBUG: cls num  : 13, elapse : 0.07335448265075684\n",
      "[2023/08/30 16:14:03] ppocr DEBUG: rec_res num  : 13, elapse : 2.066755533218384\n",
      "[2023/08/30 16:14:04] ppocr DEBUG: dt_boxes num : 18, elapse : 0.4426732063293457\n",
      "[2023/08/30 16:14:04] ppocr DEBUG: cls num  : 18, elapse : 0.09092521667480469\n",
      "[2023/08/30 16:14:06] ppocr DEBUG: rec_res num  : 18, elapse : 1.8806483745574951\n",
      "[2023/08/30 16:14:06] ppocr DEBUG: dt_boxes num : 1, elapse : 0.47429656982421875\n",
      "[2023/08/30 16:14:06] ppocr DEBUG: cls num  : 1, elapse : 0.01145792007446289\n",
      "[2023/08/30 16:14:06] ppocr DEBUG: rec_res num  : 1, elapse : 0.07058215141296387\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT202211297356-一航局-收入类-设计施工总承包合同-34页扫描件.pdf\n",
      "【表格最终格式】\n",
      "        \n",
      "|    | 要素名称               | 要素点   |\n",
      "|---:|:-----------------------|:---------|\n",
      "|  0 | 合同首部_买方信息_名称 |          |\n",
      "[2023/08/30 16:15:02] ppocr DEBUG: dt_boxes num : 20, elapse : 0.48875975608825684\n",
      "[2023/08/30 16:15:02] ppocr DEBUG: cls num  : 20, elapse : 0.10358190536499023\n",
      "[2023/08/30 16:15:05] ppocr DEBUG: rec_res num  : 20, elapse : 2.4604973793029785\n",
      "[2023/08/30 16:15:05] ppocr DEBUG: dt_boxes num : 0, elapse : 0.43137073516845703\n",
      "[2023/08/30 16:15:05] ppocr DEBUG: cls num  : 0, elapse : 0\n",
      "[2023/08/30 16:15:05] ppocr DEBUG: rec_res num  : 0, elapse : 1.6689300537109375e-06\n",
      "[2023/08/30 16:15:06] ppocr DEBUG: dt_boxes num : 20, elapse : 0.4400155544281006\n",
      "[2023/08/30 16:15:06] ppocr DEBUG: cls num  : 20, elapse : 0.10244894027709961\n",
      "[2023/08/30 16:15:10] ppocr DEBUG: rec_res num  : 20, elapse : 4.0797224044799805\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT202211379269-四航局-收入类-采购施工总承包-92页扫描件.pdf\n",
      "|    | 要素名称               | 要素点   |\n",
      "|---:|:-----------------------|:---------|\n",
      "|  0 | 合同正文_签订日期值    |          |\n",
      "|  1 | 合同标的额大写         |          |\n",
      "|  2 | 开票_发票_税率         |          |\n",
      "|  3 | 售后服务_质保_质保期   |          |\n",
      "|  4 | 合同标的额小写         |          |\n",
      "|  5 | 合同首部_买方信息_名称 |          |\n",
      "|  6 | 合同首部_卖方信息_名称 |          |\n",
      "|  7 | 生效_生效条件          |          |\n",
      "[2023/08/30 16:15:35] ppocr DEBUG: dt_boxes num : 22, elapse : 0.5226869583129883\n",
      "[2023/08/30 16:15:35] ppocr DEBUG: cls num  : 22, elapse : 0.1189887523651123\n",
      "[2023/08/30 16:15:39] ppocr DEBUG: rec_res num  : 22, elapse : 3.940237283706665\n",
      "[2023/08/30 16:15:40] ppocr DEBUG: dt_boxes num : 22, elapse : 0.4457981586456299\n",
      "[2023/08/30 16:15:40] ppocr DEBUG: cls num  : 22, elapse : 0.10796046257019043\n",
      "[2023/08/30 16:15:44] ppocr DEBUG: rec_res num  : 22, elapse : 4.521667957305908\n",
      "[2023/08/30 16:15:45] ppocr DEBUG: dt_boxes num : 31, elapse : 0.4858365058898926\n",
      "[2023/08/30 16:15:45] ppocr DEBUG: cls num  : 31, elapse : 0.16125130653381348\n",
      "[2023/08/30 16:15:50] ppocr DEBUG: rec_res num  : 31, elapse : 5.594692945480347\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT202211460211-四航局-收入类-设计施工采购总承包合同-27页扫描件.pdf\n",
      "|    | 要素名称                   | 要素点                                          |\n",
      "|---:|:---------------------------|:----------------------------------------------|\n",
      "|  0 | 合同标的_用途_标的物用途   | 尼日利亚液化天然气有限公司T7项目LNG码头新建工程        |\n",
      "|  1 | 合同首部_买方信息_地址     | PLOT 3140,MURTALA MOHAMMED EXPRESSWAY，(BESIDE RAHAMANIYYA FILLING STATION, CLOSE TO MPAPE JUNCTION),ABUJA FCT. NIGERIA |\n",
      "|  2 | 合同标的额小写             | 无                                              |\n",
      "|  3 | 合同首部_买方信息_名称     | 中国港湾（尼日利亚）有限公司                          |\n",
      "|  4 | 生效_生效时间              | 2022年5月7日                                    |\n",
      "|  5 | 期限_合同期限届满终止条款  | 2022年6月30日                                    |\n",
      "|  6 | 合同首部_卖方信息_名称     | 中交第四航务工程局有限公司                            |\n",
      "|  7 | 违约责任_卖方责任_责任条款 | 无                                              |\n",
      "[2023/08/30 16:16:30] ppocr DEBUG: dt_boxes num : 17, elapse : 0.4892251491546631\n",
      "[2023/08/30 16:16:30] ppocr DEBUG: cls num  : 17, elapse : 0.08610415458679199\n",
      "[2023/08/30 16:16:33] ppocr DEBUG: rec_res num  : 17, elapse : 2.3595244884490967\n",
      "[2023/08/30 16:16:33] ppocr DEBUG: dt_boxes num : 31, elapse : 0.4663660526275635\n",
      "[2023/08/30 16:16:33] ppocr DEBUG: cls num  : 31, elapse : 0.15280508995056152\n",
      "[2023/08/30 16:16:39] ppocr DEBUG: rec_res num  : 31, elapse : 5.838087558746338\n",
      "[2023/08/30 16:16:40] ppocr DEBUG: dt_boxes num : 39, elapse : 0.50724196434021\n",
      "[2023/08/30 16:16:40] ppocr DEBUG: cls num  : 39, elapse : 0.2020251750946045\n",
      "[2023/08/30 16:16:46] ppocr DEBUG: rec_res num  : 39, elapse : 6.195063829421997\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT202211462186-一公院-收入类-采购施工总承包-28页扫描件.pdf\n",
      "|    | 要素名称                 | 要素点   |\n",
      "|---:|:-------------------------|:---------|\n",
      "|  0 | 合同标的_用途_标的物用途 | 无       |\n",
      "|  1 | 合同首部_卖方信息_地址   | 无       |\n",
      "|  2 | 日期                     | 无       |\n",
      "|  3 | 合同首部_买方信息_名称   | 无       |\n",
      "[2023/08/30 16:17:07] ppocr DEBUG: dt_boxes num : 36, elapse : 0.5354197025299072\n",
      "[2023/08/30 16:17:07] ppocr DEBUG: cls num  : 36, elapse : 0.19214463233947754\n",
      "[2023/08/30 16:17:14] ppocr DEBUG: rec_res num  : 36, elapse : 6.896073341369629\n",
      "[2023/08/30 16:17:15] ppocr DEBUG: dt_boxes num : 29, elapse : 0.5004010200500488\n",
      "[2023/08/30 16:17:15] ppocr DEBUG: cls num  : 29, elapse : 0.15157365798950195\n",
      "[2023/08/30 16:17:22] ppocr DEBUG: rec_res num  : 29, elapse : 7.074715614318848\n",
      "[2023/08/30 16:17:23] ppocr DEBUG: dt_boxes num : 53, elapse : 0.5024957656860352\n",
      "[2023/08/30 16:17:23] ppocr DEBUG: cls num  : 53, elapse : 0.2815513610839844\n",
      "[2023/08/30 16:17:27] ppocr DEBUG: rec_res num  : 53, elapse : 4.392639636993408\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT202311331222-中国城乡-收入类-赔偿、补偿类合同-7页扫描件.pdf\n",
      "|    | 要素名称                      | 要素点                                               |\n",
      "|---:|:------------------------------|:-----------------------------------------------------|\n",
      "|  0 | 合同尾部_卖方信息_名称        | 成都蜀都文化旅游投资发展有限公司                           |\n",
      "|  1 | 合同标的额小写                | ￥100万元                                             |\n",
      "|  2 | 收款方银行信息_账户名称       | 中国市政工程西南设计研究总院有限公司                       |\n",
      "|  3 | 合同尾部_买方信息_联系方式    | 无                                                     |\n",
      "|  4 | 支付时间及方式_支付方式_支付条件  | 选择按支付方式二进行支付                                 |\n",
      "|  5 | 期限_合同期限届满终止条款     | 无                                                     |\n",
      "|  6 | 支付时间及方式_支付方式_支付比例  | 50%                                                   |\n",
      "|  7 | 合同尾部_买方信息_地址        | 无                                                     |\n",
      "|  8 | 生效_生效条件                 | 无                                                     |\n",
      "[2023/08/30 16:18:22] ppocr DEBUG: dt_boxes num : 16, elapse : 0.47739338874816895\n",
      "[2023/08/30 16:18:22] ppocr DEBUG: cls num  : 16, elapse : 0.07843232154846191\n",
      "[2023/08/30 16:18:24] ppocr DEBUG: rec_res num  : 16, elapse : 1.8359246253967285\n",
      "[2023/08/30 16:18:24] ppocr DEBUG: dt_boxes num : 91, elapse : 0.4634244441986084\n",
      "[2023/08/30 16:18:25] ppocr DEBUG: cls num  : 91, elapse : 0.4530942440032959\n",
      "[2023/08/30 16:18:32] ppocr DEBUG: rec_res num  : 91, elapse : 7.035120964050293\n",
      "[2023/08/30 16:18:33] ppocr DEBUG: dt_boxes num : 0, elapse : 0.47585082054138184\n",
      "[2023/08/30 16:18:33] ppocr DEBUG: cls num  : 0, elapse : 0\n",
      "[2023/08/30 16:18:33] ppocr DEBUG: rec_res num  : 0, elapse : 1.430511474609375e-06\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT202311405769-二公院-收入类-专业分包合同-106页扫描件.pdf\n",
      "|    | 要素名称                   | 要素点   |\n",
      "|---:|:---------------------------|:---------|\n",
      "|  0 | 开票_买方开票信息_银行账号 |          |\n",
      "|  1 | 合同首部_卖方信息_地址     |          |\n",
      "|  2 | 开票_发票_税率             |          |\n",
      "|  3 | 开票_买方开票信息_地址     |          |\n",
      "|  4 | 开票_发票_类型             |          |\n",
      "|  5 | 合同标的额小写             |          |\n",
      "|  6 | 开票_买方开票信息_发票抬头 |          |\n",
      "|  7 | 合同标的_用途_标的物用途   |          |\n",
      "|  8 | 生效_生效条件              |          |\n",
      "[2023/08/30 16:19:13] ppocr DEBUG: dt_boxes num : 10, elapse : 0.523064374923706\n",
      "[2023/08/30 16:19:13] ppocr DEBUG: cls num  : 10, elapse : 0.0583956241607666\n",
      "[2023/08/30 16:19:15] ppocr DEBUG: rec_res num  : 10, elapse : 1.5174572467803955\n",
      "[2023/08/30 16:19:15] ppocr DEBUG: dt_boxes num : 92, elapse : 0.5053877830505371\n",
      "[2023/08/30 16:19:16] ppocr DEBUG: cls num  : 92, elapse : 0.46439313888549805\n",
      "[2023/08/30 16:19:24] ppocr DEBUG: rec_res num  : 92, elapse : 8.48947262763977\n",
      "[2023/08/30 16:19:25] ppocr DEBUG: dt_boxes num : 53, elapse : 0.4969449043273926\n",
      "[2023/08/30 16:19:25] ppocr DEBUG: cls num  : 53, elapse : 0.26592302322387695\n",
      "[2023/08/30 16:19:31] ppocr DEBUG: rec_res num  : 53, elapse : 5.499025583267212\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT202311434115-二公院-收入类-专业分包合同-18页扫描件.pdf\n",
      "【表格最终格式】\n",
      "        |    | 要素名称               | 要素点   |\n",
      "|---:|:-----------------------|:---------|\n",
      "|  0 | 合同首部_卖方信息_名称 |          |\n",
      "|  1 | 合同首部_买方信息_名称 |          |\n",
      "[2023/08/30 16:20:09] ppocr DEBUG: dt_boxes num : 12, elapse : 0.4826338291168213\n",
      "[2023/08/30 16:20:09] ppocr DEBUG: cls num  : 12, elapse : 0.06291389465332031\n",
      "[2023/08/30 16:20:11] ppocr DEBUG: rec_res num  : 12, elapse : 1.7035138607025146\n",
      "[2023/08/30 16:20:12] ppocr DEBUG: dt_boxes num : 22, elapse : 0.4391765594482422\n",
      "[2023/08/30 16:20:12] ppocr DEBUG: cls num  : 22, elapse : 0.11038804054260254\n",
      "[2023/08/30 16:20:15] ppocr DEBUG: rec_res num  : 22, elapse : 3.304778575897217\n",
      "[2023/08/30 16:20:16] ppocr DEBUG: dt_boxes num : 88, elapse : 0.503838062286377\n",
      "[2023/08/30 16:20:16] ppocr DEBUG: cls num  : 88, elapse : 0.4497709274291992\n",
      "[2023/08/30 16:20:24] ppocr DEBUG: rec_res num  : 88, elapse : 7.7595298290252686\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT202311464130-机电局-收入类-采购施工总承包-285页扫描件.pdf\n",
      "| 项目名称   | 厦门海隆码头有限公司厦门港海沧港区20#、21#消位6仓库工程装卸工艺系统工程 |\n",
      "| 招标编号   | 港口开发【2023】006号 |\n",
      "| 合同编号   | HL 2023-09k |\n",
      "| 乙方名称   | 中交机电工程局有限公司 |\n",
      "| 项目工期   | 4个月 |\n",
      "| 图纸名称   | 1.形势图<br>2.总平面布置图<br>3.装卸工艺流程图 |\n",
      "| 档案号     | 1.FJ145-W4-33-1/26<br>2.FJ145-W4-33-2/26<br>3.FJ145-W4-33-3/26 |\n",
      "| 要素名称   | 要素点   |\n",
      "|------------|----------|\n",
      "| 装卸工艺布置图       | FJ145-W4-33-4/26      |\n",
      "| 装卸工艺断面图       | FJ145-W4-33-5/26      |\n",
      "| BH1带式输送机延长段布置图 | FJ145-W4-33-6/26      |\n",
      "| BH2带式输送机布置图    | FJ145-W4-33-7/26      |\n",
      "| BH3带式输送机布置图    | FJ145-W4-33-8/26      |\n",
      "| BD5带式输送机布置图    | FJ145-W4-33-9/26      |\n",
      "| BZ带式输送机布置图     | FJ145-W4-33-10/26    |\n",
      "| BH1带式输送机电子皮带秤位置图 | FJ145-W4-33-11/26    |\n",
      "| 采制样系统工艺布置图    | FJ145-W4-33-12/26    |\n",
      "| 6#粮食平房仓仓库中间屋面预留洞布置图       | FJ145-W4-33-13/26    |\n",
      "| 6#粮食平房仓地面卸粮坑布置图       | FJ145-W4-33-14/26    |\n",
      "| 6#粮食平房仓卸梁坑详图       | FJ145-W4-33-15/26    |\n",
      "| 供电平面图       | FJ145-W4-33-16/26    |\n",
      "| 高压系统图       | FJ145-W4-33-17/26    |\n",
      "| 低压系统图一       | FJ145-W4-33-18/26    |\n",
      "| 低压系统图二       | FJ145-W4-33-19/26    |\n",
      "| 低压系统图三           | FJ145-W4-33-20/26   |\n",
      "| 控制系统图             | FJ145-W4-33-21/26   |\n",
      "| 视频监控系统图          | FJ145-W4-33-22/26   |\n",
      "| 6#粮食平房仓通风设计说明及材料表 | FJ145-W4-33-23/26   |\n",
      "| 6#粮食平房仓通风设备平面布置图 | FJ145-W4-33-24/26   |\n",
      "| 除尘流程图             | FJ145-W4-33-25/26   |\n",
      "| 室外动力管网            | FJ145-W4-33-26/26   |\n",
      "| 压缩空气管网平面图        | 285                   |\n",
      "[2023/08/30 16:21:34] ppocr DEBUG: dt_boxes num : 35, elapse : 0.5339095592498779\n",
      "[2023/08/30 16:21:35] ppocr DEBUG: cls num  : 35, elapse : 0.18477869033813477\n",
      "[2023/08/30 16:21:40] ppocr DEBUG: rec_res num  : 35, elapse : 5.710685729980469\n",
      "[2023/08/30 16:21:41] ppocr DEBUG: dt_boxes num : 21, elapse : 0.4910297393798828\n",
      "[2023/08/30 16:21:41] ppocr DEBUG: cls num  : 21, elapse : 0.11367392539978027\n",
      "[2023/08/30 16:21:46] ppocr DEBUG: rec_res num  : 21, elapse : 4.858500003814697\n",
      "[2023/08/30 16:21:46] ppocr DEBUG: dt_boxes num : 32, elapse : 0.49378085136413574\n",
      "[2023/08/30 16:21:47] ppocr DEBUG: cls num  : 32, elapse : 0.17016315460205078\n",
      "[2023/08/30 16:21:52] ppocr DEBUG: rec_res num  : 32, elapse : 5.602962017059326\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT202311465575-四航局-收入类-其他工程类合同-12页扫描件.pdf\n",
      "|    | 要素名称               | 要素点   |\n",
      "|---:|:-----------------------|:---------|\n",
      "|  0 | 开票_发票_税率         |          |\n",
      "|  1 | 开票_发票_发票类型     |          |\n",
      "|  2 | 合同首部_卖方信息_名称 |          |\n",
      "|  3 | 合同标的额小写         |          |\n",
      "|  4 | 合同首部_买方信息_名称 |          |\n",
      "[2023/08/30 16:22:18] ppocr DEBUG: dt_boxes num : 38, elapse : 0.5318832397460938\n",
      "[2023/08/30 16:22:18] ppocr DEBUG: cls num  : 38, elapse : 0.19514179229736328\n",
      "[2023/08/30 16:22:23] ppocr DEBUG: rec_res num  : 38, elapse : 4.98461389541626\n",
      "[2023/08/30 16:22:24] ppocr DEBUG: dt_boxes num : 25, elapse : 0.487241268157959\n",
      "[2023/08/30 16:22:24] ppocr DEBUG: cls num  : 25, elapse : 0.12900948524475098\n",
      "[2023/08/30 16:22:29] ppocr DEBUG: rec_res num  : 25, elapse : 5.045867681503296\n",
      "[2023/08/30 16:22:30] ppocr DEBUG: dt_boxes num : 35, elapse : 0.48694276809692383\n",
      "[2023/08/30 16:22:30] ppocr DEBUG: cls num  : 35, elapse : 0.17696547508239746\n",
      "[2023/08/30 16:22:33] ppocr DEBUG: rec_res num  : 35, elapse : 3.0128071308135986\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/CT202311466757-中国城乡-收入类-其他工程类合同-7页扫描件.pdf\n",
      "        【表格最终格式】\n",
      "        |    | 要素名称               | 要素点        |\n",
      "|---:|:-----------------------|:------------|\n",
      "|  0 | 合同标的额大写         |          |\n",
      "|  1 | 开票_发票_税率         |          |\n",
      "|  2 | 开票_发票_类型         |          |\n",
      "|  3 | 合同首部_买方信息_名称 |          |\n",
      "[2023/08/30 16:22:59] ppocr DEBUG: dt_boxes num : 14, elapse : 0.47649598121643066\n",
      "[2023/08/30 16:22:59] ppocr DEBUG: cls num  : 14, elapse : 0.07173943519592285\n",
      "[2023/08/30 16:23:01] ppocr DEBUG: rec_res num  : 14, elapse : 1.1344094276428223\n",
      "[2023/08/30 16:23:01] ppocr DEBUG: dt_boxes num : 28, elapse : 0.4479639530181885\n",
      "[2023/08/30 16:23:01] ppocr DEBUG: cls num  : 28, elapse : 0.13824868202209473\n",
      "[2023/08/30 16:23:06] ppocr DEBUG: rec_res num  : 28, elapse : 4.9739460945129395\n",
      "[2023/08/30 16:23:07] ppocr DEBUG: dt_boxes num : 33, elapse : 0.46778082847595215\n",
      "[2023/08/30 16:23:07] ppocr DEBUG: cls num  : 33, elapse : 0.1604907512664795\n",
      "[2023/08/30 16:23:09] ppocr DEBUG: rec_res num  : 33, elapse : 2.3316123485565186\n",
      "./标书实体抽取挑战赛公开数据/test/pdf/TMHT001-建设项目工程总承包合同.pdf\n",
      "|    | 要素名称                   | 要素点   |\n",
      "|---:|:---------------------------|:---------|\n",
      "|  0 | 合同正文_签订日期值        |          |\n",
      "|  1 | 合同尾部_买方信息_联系方式 |          |\n",
      "|  2 | 生效_生效条件              |          |\n"
     ]
    }
   ],
   "source": [
    "# Tunables for the extraction loop below.\n",
    "PDF_RENDER_DPI = 200    # resolution passed to convert_from_path\n",
    "LINES_PER_CHUNK = 50    # OCR text lines sent to the model per request\n",
    "REQUEST_TIMEOUT = 120   # seconds; a stalled API call fails instead of hanging the run\n",
    "\n",
    "# Request settings are loop-invariant, so they are built once rather than per PDF.\n",
    "url = 'https://oa.api2d.site/v1/chat/completions'\n",
    "headers = {\n",
    "    'Content-Type': 'application/json',\n",
    "    'Authorization': 'Bearer 替换为你的api-key',\n",
    "}\n",
    "\n",
    "\n",
    "def ask_model(prompt):\n",
    "    \"\"\"Send `prompt` as one user message and return the reply text.\n",
    "\n",
    "    Raises:\n",
    "        requests.HTTPError: the endpoint answered with a non-2xx status, so an\n",
    "            API failure is reported as such rather than as a KeyError on the\n",
    "            missing 'choices' field.\n",
    "    \"\"\"\n",
    "    payload = {\n",
    "        'model': 'gpt-3.5-turbo',\n",
    "        'messages': [{'role': 'user', 'content': prompt}],\n",
    "    }\n",
    "    response = requests.post(url, headers=headers, json=payload, timeout=REQUEST_TIMEOUT)\n",
    "    response.raise_for_status()\n",
    "    return response.json()['choices'][0]['message']['content']\n",
    "\n",
    "\n",
    "def parse_element_values(markdown_table):\n",
    "    \"\"\"Return the 要素点 column of a markdown table as a list of strings.\n",
    "\n",
    "    Only lines starting with '|' (ignoring indentation) count as table rows,\n",
    "    so text the model emits around the table is skipped. Cells are stripped\n",
    "    one by one, which removes the padding but keeps spaces inside a value.\n",
    "\n",
    "    Raises:\n",
    "        ValueError: no table row was found, or the first row (the header)\n",
    "            has no 要素点 column.\n",
    "    \"\"\"\n",
    "    rows = []\n",
    "    for raw_line in markdown_table.splitlines():\n",
    "        stripped = raw_line.strip()\n",
    "        if not stripped.startswith('|'):\n",
    "            continue\n",
    "        # Drop exactly one leading and one trailing pipe so empty edge cells survive.\n",
    "        inner = stripped[1:-1] if len(stripped) > 1 and stripped.endswith('|') else stripped[1:]\n",
    "        rows.append([cell.strip() for cell in inner.split('|')])\n",
    "\n",
    "    if not rows or '要素点' not in rows[0]:\n",
    "        raise ValueError('model answer has no markdown table with a 要素点 column')\n",
    "\n",
    "    value_col = rows[0].index('要素点')\n",
    "    values = []\n",
    "    for row in rows[1:]:\n",
    "        # The |---:|:---| alignment row carries no data.\n",
    "        if all(cell and set(cell) <= set('-:') for cell in row):\n",
    "            continue\n",
    "        # A row that is too short is treated as having an empty value.\n",
    "        values.append(row[value_col] if value_col < len(row) else '')\n",
    "    return values\n",
    "\n",
    "\n",
    "for pdf_path, label_path in zip(test_pdf[3:], test_label[3:]):\n",
    "\n",
    "    # Step 1: load the elements to extract; 要素点 is the blank column the model fills in.\n",
    "    df = pd.read_excel(label_path)\n",
    "    df['要素点'] = ''\n",
    "    table_template = df.to_markdown()  # identical for every request of this PDF\n",
    "\n",
    "    # Step 2: OCR the first, second and last page of the PDF.\n",
    "    all_pages = convert_from_path(pdf_path, PDF_RENDER_DPI)\n",
    "    # De-duplicated, in-range indices: a 1-page PDF no longer raises IndexError\n",
    "    # and a 2-page PDF no longer has its second page OCR'd twice.\n",
    "    page_indices = sorted({0, 1, len(all_pages) - 1} & set(range(len(all_pages))))\n",
    "    pages = [all_pages[i] for i in page_indices]\n",
    "    content = ''\n",
    "    for page in pages:\n",
    "        # The OCR call below reads the page back from this scratch file.\n",
    "        page.save('out.jpg', 'JPEG')\n",
    "\n",
    "        result = ocr.ocr('out.jpg', cls=True)\n",
    "        for res in result:\n",
    "            # NOTE(review): some PaddleOCR releases appear to return None for an\n",
    "            # image without detected text - confirm; `or []` is harmless either way.\n",
    "            for line in res or []:\n",
    "                content += line[1][0] + '\\n'\n",
    "\n",
    "        content += '\\n'\n",
    "\n",
    "    # Step 3: ask the model to fill the table from each chunk of OCR lines.\n",
    "    ocr_lines = content.split('\\n')\n",
    "    table_extract_result = []\n",
    "    # Stepping by the chunk size (instead of len // 50 + 1 iterations) avoids an\n",
    "    # empty final request when the line count is a multiple of the chunk size.\n",
    "    for start in range(0, len(ocr_lines), LINES_PER_CHUNK):\n",
    "        input_content = '\\n'.join(ocr_lines[start:start + LINES_PER_CHUNK])\n",
    "\n",
    "        # The prompt text, including its indentation, is kept exactly as before.\n",
    "        extract_prompt = f\"\"\"\n",
    "            【任务】帮我从内容中提取信息，填充下面的表格，如果无法填充，则填无。只需要输出待填充表格。\n",
    "\n",
    "            【输入信息】\n",
    "            {input_content}\n",
    "\n",
    "            【待填充表格内容】\n",
    "            {table_template}\n",
    "            \"\"\"\n",
    "        table_extract_result.append(ask_model(extract_prompt))\n",
    "\n",
    "    # Step 4: have the model merge the per-chunk tables into one final table.\n",
    "    merged_input = '\\n\\n'.join(table_extract_result)\n",
    "\n",
    "    merge_prompt = f\"\"\"\n",
    "        【任务】帮将表格信息进行合并，只需要输出待填充表格。\n",
    "\n",
    "        【输入信息】\n",
    "        {merged_input}\n",
    "\n",
    "        【表格最终格式】\n",
    "        {table_template}\n",
    "        \"\"\"\n",
    "    answer = ask_model(merge_prompt)\n",
    "\n",
    "    print(pdf_path)\n",
    "    print(answer)\n",
    "\n",
    "    # Step 5: write the filled-in column, one value per line, as this PDF's submission file.\n",
    "    try:\n",
    "        element_values = parse_element_values(answer)\n",
    "        pd.Series(element_values, dtype=object).to_csv(\n",
    "            './submit/' + pdf_path.split('/')[-1][:-4] + '.csv', index=None, header=None\n",
    "        )\n",
    "    except Exception as err:\n",
    "        # Still best effort (an unusable answer skips this PDF), but the skip is\n",
    "        # now visible and Ctrl-C is no longer swallowed.\n",
    "        print(f'[skipped] {pdf_path}: {err!r}')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 101,
   "id": "cb8afd2a-7b65-40f2-a9f7-ac4a21e373a1",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "# Delete the .ipynb_checkpoints folder inside ./submit (presumably so the zip step that follows does not pack it - confirm).\n",
    "!\\rm -rf ./submit/.ipynb_checkpoints/"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 102,
   "id": "773e2176-f5d5-4835-8e7e-dad41254df07",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "  adding: submit/ (stored 0%)\n",
      "  adding: submit/CT201710984626-中交建筑-收入类-内部任务书-4页扫描件.csv (deflated 74%)\n",
      "  adding: submit/CT201411033436-信科集团-支出类-设备 (含船机)购销合同-28页扫描件.csv (deflated 71%)\n",
      "  adding: submit/CT201111215740-民航机场建设集团-支出类-设计合同-8页扫描件.csv (deflated 23%)\n",
      "  adding: submit/CT202110629429-四航局-收入类-赔偿、补偿类合同-3页扫描件.csv (deflated 67%)\n",
      "  adding: submit/CT202211297356-一航局-收入类-设计施工总承包合同-34页扫描件.csv (stored 0%)\n",
      "  adding: submit/CT202311405769-二公院-收入类-专业分包合同-106页扫描件.csv (deflated 74%)\n",
      "  adding: submit/CT201310863030-民航机场建设集团-支出类-专业分包合同-23页扫描件.csv (deflated 67%)\n",
      "  adding: submit/CT201810217655-一航局-收入类-专业分包合同-68页扫描件.csv (stored 0%)\n",
      "  adding: submit/CT202110330559-三航局-收入类-赔偿、补偿类合同-3页扫描件.csv (deflated 71%)\n",
      "  adding: submit/CT201311324586-中交建筑-支出类-劳务分包合同-33页扫描件.csv (deflated 22%)\n",
      "  adding: submit/CT201210918007-一公局-支出类-专业分包合同-26页扫描件.csv (deflated 53%)\n",
      "  adding: submit/CT202311466757-中国城乡-收入类-其他工程类合同-7页扫描件.csv (stored 0%)\n",
      "  adding: submit/CT202211460211-四航局-收入类-设计施工采购总承包合同-27页扫描件.csv (deflated 15%)\n",
      "  adding: submit/CT201410957473-中交疏浚-支出类-专业分包合同-10页扫描件.csv (deflated 61%)\n",
      "  adding: submit/CT201110576783-一公院-支出类-设计合同-7页扫描件.csv (deflated 71%)\n",
      "  adding: submit/CT201310177080-一航局-支出类-劳务分包合同-28页扫描件.csv (deflated 22%)\n",
      "  adding: submit/CT201411316563-中交建筑-收入类-施工（总）承包-6页扫描件.csv (deflated 79%)\n",
      "  adding: submit/CT201110704238-一公院-支出类-设备 (含船机)购销合同-7页扫描件.csv (deflated 7%)\n",
      "  adding: submit/TMHT001-建设项目工程总承包合同.csv (deflated 22%)\n",
      "  adding: submit/CT201210212814-一航局-支出类-专业分包合同-30页扫描件.csv (stored 0%)\n",
      "  adding: submit/CT201410925185-一公局-支出类-物资购销合同-5页模糊扫描件.csv (deflated 18%)\n",
      "  adding: submit/CT202311331222-中国城乡-收入类-赔偿、补偿类合同-7页扫描件.csv (deflated 11%)\n",
      "  adding: submit/CT200810475234-中交建筑-支出类-劳务分包合同-21页扫描件.csv (deflated 11%)\n",
      "  adding: submit/CT202211462186-一公院-收入类-采购施工总承包-28页扫描件.csv (deflated 44%)\n",
      "  adding: submit/CT201810171842-中交路建-收入类-赔偿、补偿类合同-4页扫描件.csv (deflated 41%)\n",
      "  adding: submit/CT201410581136-三公局-支出类-劳务分包合同-45页扫描件.csv (deflated 42%)\n",
      "  adding: submit/CT202311464130-机电局-收入类-采购施工总承包-285页扫描件.csv (stored 0%)\n",
      "  adding: submit/CT201210917910-一公局-支出类-专业分包合同-15页扫描件.csv (deflated 38%)\n",
      "  adding: submit/CT201011166974-信科集团-支出类-物资购销合同-40页扫描件.csv (deflated 67%)\n",
      "  adding: submit/CT201410736682-中交房地产-支出类-专业分包合同-65页扫描件.csv (stored 0%)\n",
      "  adding: submit/CT202311434115-二公院-收入类-专业分包合同-18页扫描件.csv (stored 0%)\n",
      "  adding: submit/CT201210455567-一航局-支出类-设备 (含船机)购销合同-8页扫描件.csv (stored 0%)\n",
      "  adding: submit/CT201710190380-一航局-收入类-设计施工总承包合同-85页扫描件.csv (stored 0%)\n",
      "  adding: submit/CT201310562425-中交建筑-支出类-劳务分包合同-13页扫描件.csv (deflated 39%)\n",
      "  adding: submit/CT201811444794-四航局-收入类-采购施工总承包-6页扫描件.csv (deflated 7%)\n",
      "  adding: submit/CT201711459614-中交疏浚-收入类-设计施工总承包合同-31页扫描件.csv (stored 0%)\n",
      "  adding: submit/CT201411334205-四航局-支出类-劳务分包合同-17页扫描件.csv (deflated 17%)\n",
      "  adding: submit/CT200810050037-中国城乡-支出类-设计合同-9页扫描件.csv (stored 0%)\n",
      "  adding: submit/CT201411131833-一公院-支出类-设备 (含船机)购销合同-10页扫描件.csv (deflated 43%)\n",
      "  adding: submit/CT202010023734-二公院-收入类-设计施工总承包合同-36页扫描件.csv (deflated 61%)\n",
      "  adding: submit/CT202211379269-四航局-收入类-采购施工总承包-92页扫描件.csv (deflated 71%)\n",
      "  adding: submit/CT201211133943-一航局-支出类-设备 (含船机)购销合同-28页扫描件.csv (deflated 53%)\n",
      "  adding: submit/CT201511143732-西筑公司-收入类-劳务分包合同-5页扫描件.csv (deflated 42%)\n",
      "  adding: submit/CT201210928685-三公局-支出类-物资购销合同-4页扫描件.csv (deflated 29%)\n",
      "  adding: submit/CT201011002502-上海振华重工-支出类-设备 (含船机)购销合同-12页扫描件.csv (deflated 22%)\n",
      "  adding: submit/CT201611379239-中国城乡-收入类-其他工程类合同-5页扫描件.csv (deflated 67%)\n",
      "  adding: submit/CT201711260968-四航局-收入类-设计施工采购总承包合同-150页扫描件.csv (deflated 5%)\n",
      "  adding: submit/CT201311302717-民航机场建设集团-支出类-设计合同-8页扫描件.csv (stored 0%)\n",
      "  adding: submit/CT201311207591-中资集团-支出类-设计合同-11页扫描件.csv (deflated 22%)\n",
      "  adding: submit/CT202311465575-四航局-收入类-其他工程类合同-12页扫描件.csv (deflated 53%)\n"
     ]
    }
   ],
   "source": [
    "# Remove any previous archive first: zip updates an existing file in place, so entries\n",
    "# whose source files were deleted since the last run would otherwise stay in the archive.\n",
    "!rm -f submit.zip && zip -r submit.zip submit"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "0d90f7ee-fd8d-4ba1-8b2b-a8393489bd66",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3.10"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.10"
  },
  "widgets": {
   "application/vnd.jupyter.widget-state+json": {
    "state": {},
    "version_major": 2,
    "version_minor": 0
   }
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
